VideoCommon: cache the per-vertex position/normal matrix index

This commit is contained in:
Tillmann Karras 2024-12-16 00:56:10 +00:00
parent f9ce2b9d76
commit 3701c0234e
8 changed files with 36 additions and 73 deletions

View File

@ -70,7 +70,6 @@ struct alignas(16) VertexShaderConstants
u32 missing_color_hex; // .w, used for change detection but not directly by shaders u32 missing_color_hex; // .w, used for change detection but not directly by shaders
float4 missing_color_value; float4 missing_color_value;
std::array<float4, 6> posnormalmatrix;
std::array<float4, 4> projection; std::array<float4, 4> projection;
std::array<int4, 4> materials; std::array<int4, 4> materials;
struct Light struct Light
@ -93,6 +92,8 @@ struct alignas(16) VertexShaderConstants
// .x - texMtxInfo, .y - postMtxInfo, [0..1].z = color, [0..1].w = alpha // .x - texMtxInfo, .y - postMtxInfo, [0..1].z = color, [0..1].w = alpha
std::array<uint4, 8> xfmem_pack1; std::array<uint4, 8> xfmem_pack1;
// TODO: only first element is currently used
std::array<u32, 4> cached_posmtxidx;
float4 cached_normal; float4 cached_normal;
float4 cached_tangent; float4 cached_tangent;
float4 cached_binormal; float4 cached_binormal;

View File

@ -273,7 +273,6 @@ void WriteSwitch(ShaderCode& out, APIType ApiType, std::string_view variable,
#define I_ZSLOPE "czslope" #define I_ZSLOPE "czslope"
#define I_EFBSCALE "cefbscale" #define I_EFBSCALE "cefbscale"
#define I_POSNORMALMATRIX "cpnmtx"
#define I_PROJECTION "cproj" #define I_PROJECTION "cproj"
#define I_MATERIALS "cmtrl" #define I_MATERIALS "cmtrl"
#define I_LIGHTS "clights" #define I_LIGHTS "clights"
@ -283,6 +282,7 @@ void WriteSwitch(ShaderCode& out, APIType ApiType, std::string_view variable,
#define I_POSTTRANSFORMMATRICES "cpostmtx" #define I_POSTTRANSFORMMATRICES "cpostmtx"
#define I_PIXELCENTERCORRECTION "cpixelcenter" #define I_PIXELCENTERCORRECTION "cpixelcenter"
#define I_VIEWPORT_SIZE "cviewport" #define I_VIEWPORT_SIZE "cviewport"
#define I_CACHED_POSMTXIDX "cposmtxidx"
#define I_CACHED_NORMAL "cnormal" #define I_CACHED_NORMAL "cnormal"
#define I_CACHED_TANGENT "ctangent" #define I_CACHED_TANGENT "ctangent"
#define I_CACHED_BINORMAL "cbinormal" #define I_CACHED_BINORMAL "cbinormal"
@ -296,7 +296,6 @@ static const char s_shader_uniforms[] = "\tuint components;\n"
"\tuint xfmem_numColorChans;\n" "\tuint xfmem_numColorChans;\n"
"\tuint missing_color_hex;\n" "\tuint missing_color_hex;\n"
"\tfloat4 missing_color_value;\n" "\tfloat4 missing_color_value;\n"
"\tfloat4 " I_POSNORMALMATRIX "[6];\n"
"\tfloat4 " I_PROJECTION "[4];\n" "\tfloat4 " I_PROJECTION "[4];\n"
"\tint4 " I_MATERIALS "[4];\n" "\tint4 " I_MATERIALS "[4];\n"
"\tLight " I_LIGHTS "[8];\n" "\tLight " I_LIGHTS "[8];\n"
@ -307,6 +306,7 @@ static const char s_shader_uniforms[] = "\tuint components;\n"
"\tfloat4 " I_PIXELCENTERCORRECTION ";\n" "\tfloat4 " I_PIXELCENTERCORRECTION ";\n"
"\tfloat2 " I_VIEWPORT_SIZE ";\n" "\tfloat2 " I_VIEWPORT_SIZE ";\n"
"\tuint4 xfmem_pack1[8];\n" "\tuint4 xfmem_pack1[8];\n"
"\tuint4 " I_CACHED_POSMTXIDX ";\n"
"\tfloat4 " I_CACHED_NORMAL ";\n" "\tfloat4 " I_CACHED_NORMAL ";\n"
"\tfloat4 " I_CACHED_TANGENT ";\n" "\tfloat4 " I_CACHED_TANGENT ";\n"
"\tfloat4 " I_CACHED_BINORMAL ";\n" "\tfloat4 " I_CACHED_BINORMAL ";\n"

View File

@ -223,28 +223,23 @@ float3 load_input_float3_rawtex(uint vtx_offset, uint attr_offset) {{
"float3 N1;\n" "float3 N1;\n"
"float3 N2;\n" "float3 N2;\n"
"\n" "\n"
"uint posidx;\n"
"if ((components & {}u) != 0u) {{ // VB_HAS_POSMTXIDX\n", "if ((components & {}u) != 0u) {{ // VB_HAS_POSMTXIDX\n",
Common::ToUnderlying(VB_HAS_POSMTXIDX)); Common::ToUnderlying(VB_HAS_POSMTXIDX));
LoadVertexAttribute(out, host_config, 2, "posmtx", "uint4", "ubyte4"); LoadVertexAttribute(out, host_config, 2, "posmtx", "uint4", "ubyte4");
out.Write(" // Vertex format has a per-vertex matrix\n" out.Write(" // Vertex format has a per-vertex matrix\n"
" int posidx = int(posmtx.r);\n" " posidx = int(posmtx.r);\n"
"}} else {{\n"
" posidx = " I_CACHED_POSMTXIDX ".r;\n"
"}}\n"
"P0 = " I_TRANSFORMMATRICES "[posidx];\n" "P0 = " I_TRANSFORMMATRICES "[posidx];\n"
"P1 = " I_TRANSFORMMATRICES "[posidx+1];\n" "P1 = " I_TRANSFORMMATRICES "[posidx+1];\n"
"P2 = " I_TRANSFORMMATRICES "[posidx+2];\n" "P2 = " I_TRANSFORMMATRICES "[posidx+2];\n"
"\n" "\n"
" int normidx = posidx >= 32 ? (posidx - 32) : posidx;\n" "uint normidx = posidx >= 32 ? (posidx - 32) : posidx;\n"
"N0 = " I_NORMALMATRICES "[normidx].xyz;\n" "N0 = " I_NORMALMATRICES "[normidx].xyz;\n"
"N1 = " I_NORMALMATRICES "[normidx+1].xyz;\n" "N1 = " I_NORMALMATRICES "[normidx+1].xyz;\n"
"N2 = " I_NORMALMATRICES "[normidx+2].xyz;\n" "N2 = " I_NORMALMATRICES "[normidx+2].xyz;\n"
"}} else {{\n"
" // One shared matrix\n"
" P0 = " I_POSNORMALMATRIX "[0];\n"
" P1 = " I_POSNORMALMATRIX "[1];\n"
" P2 = " I_POSNORMALMATRIX "[2];\n"
" N0 = " I_POSNORMALMATRIX "[3].xyz;\n"
" N1 = " I_POSNORMALMATRIX "[4].xyz;\n"
" N2 = " I_POSNORMALMATRIX "[5].xyz;\n"
"}}\n"
"\n" "\n"
"// Multiply the position vector by the position matrix\n" "// Multiply the position vector by the position matrix\n"
"float4 pos = float4(dot(P0, rawpos), dot(P1, rawpos), dot(P2, rawpos), 1.0);\n" "float4 pos = float4(dot(P0, rawpos), dot(P1, rawpos), dot(P2, rawpos), 1.0);\n"

View File

@ -558,6 +558,13 @@ void VertexManagerBase::Flush()
pixel_shader_manager.constants.time_ms = seconds_elapsed * 1000; pixel_shader_manager.constants.time_ms = seconds_elapsed * 1000;
} }
if (VertexLoaderManager::GetCurrentVertexFormat()->GetVertexDeclaration().posmtx.enable)
{
u32 posmtx = VertexLoaderManager::position_matrix_index_cache[0];
u32 texmtx = xfmem.MatrixIndexA.Hex & 0xFFFF'FFC0;
xf_state_manager.SetTexMatrixChangedA(texmtx | posmtx);
xfmem.MatrixIndexA.PosNormalMtxIdx = posmtx;
}
CalculateNormals(VertexLoaderManager::GetCurrentVertexFormat()); CalculateNormals(VertexLoaderManager::GetCurrentVertexFormat());
// Calculate ZSlope for zfreeze // Calculate ZSlope for zfreeze
const auto used_textures = UsedTextures(); const auto used_textures = UsedTextures();

View File

@ -306,29 +306,25 @@ ShaderCode GenerateVertexShaderCode(APIType api_type, const ShaderHostConfig& ho
} }
// transforms // transforms
if ((uid_data->components & VB_HAS_POSMTXIDX) != 0) if (uid_data->components & VB_HAS_POSMTXIDX)
{ {
// Vertex format has a per-vertex matrix // per-vertex position/normal matrix index
out.Write("int posidx = int(posmtx.r);\n" out.Write("uint posidx = int(posmtx.r);\n");
"float4 P0 = " I_TRANSFORMMATRICES "[posidx];\n"
"float4 P1 = " I_TRANSFORMMATRICES "[posidx + 1];\n"
"float4 P2 = " I_TRANSFORMMATRICES "[posidx + 2];\n"
"int normidx = posidx & 31;\n"
"float3 N0 = " I_NORMALMATRICES "[normidx].xyz;\n"
"float3 N1 = " I_NORMALMATRICES "[normidx + 1].xyz;\n"
"float3 N2 = " I_NORMALMATRICES "[normidx + 2].xyz;\n");
} }
else else
{ {
// One shared matrix // shared position/normal matrix index
out.Write("float4 P0 = " I_POSNORMALMATRIX "[0];\n" out.Write("uint posidx = " I_CACHED_POSMTXIDX ".r;\n");
"float4 P1 = " I_POSNORMALMATRIX "[1];\n"
"float4 P2 = " I_POSNORMALMATRIX "[2];\n"
"float3 N0 = " I_POSNORMALMATRIX "[3].xyz;\n"
"float3 N1 = " I_POSNORMALMATRIX "[4].xyz;\n"
"float3 N2 = " I_POSNORMALMATRIX "[5].xyz;\n");
} }
out.Write("float4 P0 = " I_TRANSFORMMATRICES "[posidx];\n"
"float4 P1 = " I_TRANSFORMMATRICES "[posidx + 1];\n"
"float4 P2 = " I_TRANSFORMMATRICES "[posidx + 2];\n"
"uint normidx = posidx & 31;\n"
"float3 N0 = " I_NORMALMATRICES "[normidx].xyz;\n"
"float3 N1 = " I_NORMALMATRICES "[normidx + 1].xyz;\n"
"float3 N2 = " I_NORMALMATRICES "[normidx + 2].xyz;\n");
out.Write("// Multiply the position vector by the position matrix\n" out.Write("// Multiply the position vector by the position matrix\n"
"float4 pos = float4(dot(P0, rawpos), dot(P1, rawpos), dot(P2, rawpos), 1.0);\n"); "float4 pos = float4(dot(P0, rawpos), dot(P1, rawpos), dot(P2, rawpos), 1.0);\n");
if ((uid_data->components & VB_HAS_NORMAL) == 0) if ((uid_data->components & VB_HAS_NORMAL) == 0)

View File

@ -289,23 +289,10 @@ void VertexShaderManager::SetConstants(const std::vector<std::string>& textures,
} }
xf_state_manager.ResetMaterialChanges(); xf_state_manager.ResetMaterialChanges();
if (xf_state_manager.DidPosNormalChange())
{
xf_state_manager.ResetPosNormalChange();
const float* pos = &xfmem.posMatrices[g_main_cp_state.matrix_index_a.PosNormalMtxIdx * 4];
const float* norm =
&xfmem.normalMatrices[3 * (g_main_cp_state.matrix_index_a.PosNormalMtxIdx & 31)];
memcpy(constants.posnormalmatrix.data(), pos, 3 * sizeof(float4));
memcpy(constants.posnormalmatrix[3].data(), norm, 3 * sizeof(float));
memcpy(constants.posnormalmatrix[4].data(), norm + 3, 3 * sizeof(float));
memcpy(constants.posnormalmatrix[5].data(), norm + 6, 3 * sizeof(float));
dirty = true;
}
if (xf_state_manager.DidTexMatrixAChange()) if (xf_state_manager.DidTexMatrixAChange())
{ {
xf_state_manager.ResetTexMatrixAChange(); xf_state_manager.ResetTexMatrixAChange();
constants.cached_posmtxidx[0] = g_main_cp_state.matrix_index_a.PosNormalMtxIdx;
const std::array<const float*, 4> pos_matrix_ptrs{ const std::array<const float*, 4> pos_matrix_ptrs{
&xfmem.posMatrices[g_main_cp_state.matrix_index_a.Tex0MtxIdx * 4], &xfmem.posMatrices[g_main_cp_state.matrix_index_a.Tex0MtxIdx * 4],
&xfmem.posMatrices[g_main_cp_state.matrix_index_a.Tex1MtxIdx * 4], &xfmem.posMatrices[g_main_cp_state.matrix_index_a.Tex1MtxIdx * 4],

View File

@ -14,7 +14,6 @@ void XFStateManager::Init()
// Initialize state tracking variables // Initialize state tracking variables
ResetTexMatrixAChange(); ResetTexMatrixAChange();
ResetTexMatrixBChange(); ResetTexMatrixBChange();
ResetPosNormalChange();
ResetProjection(); ResetProjection();
ResetViewportChange(); ResetViewportChange();
ResetTexMatrixInfoChange(); ResetTexMatrixInfoChange();
@ -37,7 +36,6 @@ void XFStateManager::DoState(PointerWrap& p)
p.Do(m_materials_changed); p.Do(m_materials_changed);
p.DoArray(m_tex_matrices_changed); p.DoArray(m_tex_matrices_changed);
p.Do(m_pos_normal_matrix_changed);
p.Do(m_projection_changed); p.Do(m_projection_changed);
p.Do(m_viewport_changed); p.Do(m_viewport_changed);
p.Do(m_tex_mtx_info_changed); p.Do(m_tex_mtx_info_changed);
@ -53,16 +51,6 @@ void XFStateManager::DoState(PointerWrap& p)
void XFStateManager::InvalidateXFRange(int start, int end) void XFStateManager::InvalidateXFRange(int start, int end)
{ {
if (((u32)start >= (u32)g_main_cp_state.matrix_index_a.PosNormalMtxIdx * 4 &&
(u32)start < (u32)g_main_cp_state.matrix_index_a.PosNormalMtxIdx * 4 + 12) ||
((u32)start >=
XFMEM_NORMALMATRICES + ((u32)g_main_cp_state.matrix_index_a.PosNormalMtxIdx & 31) * 3 &&
(u32)start < XFMEM_NORMALMATRICES +
((u32)g_main_cp_state.matrix_index_a.PosNormalMtxIdx & 31) * 3 + 9))
{
m_pos_normal_matrix_changed = true;
}
if (((u32)start >= (u32)g_main_cp_state.matrix_index_a.Tex0MtxIdx * 4 && if (((u32)start >= (u32)g_main_cp_state.matrix_index_a.Tex0MtxIdx * 4 &&
(u32)start < (u32)g_main_cp_state.matrix_index_a.Tex0MtxIdx * 4 + 12) || (u32)start < (u32)g_main_cp_state.matrix_index_a.Tex0MtxIdx * 4 + 12) ||
((u32)start >= (u32)g_main_cp_state.matrix_index_a.Tex1MtxIdx * 4 && ((u32)start >= (u32)g_main_cp_state.matrix_index_a.Tex1MtxIdx * 4 &&
@ -174,8 +162,6 @@ void XFStateManager::SetTexMatrixChangedA(u32 Value)
if (g_main_cp_state.matrix_index_a.Hex != Value) if (g_main_cp_state.matrix_index_a.Hex != Value)
{ {
g_vertex_manager->Flush(); g_vertex_manager->Flush();
if (g_main_cp_state.matrix_index_a.PosNormalMtxIdx != (Value & 0x3f))
m_pos_normal_matrix_changed = true;
m_tex_matrices_changed[0] = true; m_tex_matrices_changed[0] = true;
g_main_cp_state.matrix_index_a.Hex = Value; g_main_cp_state.matrix_index_a.Hex = Value;
} }
@ -201,11 +187,6 @@ void XFStateManager::ResetTexMatrixBChange()
m_tex_matrices_changed[1] = false; m_tex_matrices_changed[1] = false;
} }
void XFStateManager::ResetPosNormalChange()
{
m_pos_normal_matrix_changed = false;
}
void XFStateManager::SetProjectionChanged() void XFStateManager::SetProjectionChanged()
{ {
m_projection_changed = true; m_projection_changed = true;

View File

@ -27,9 +27,6 @@ public:
bool DidTexMatrixBChange() const { return m_tex_matrices_changed[1]; } bool DidTexMatrixBChange() const { return m_tex_matrices_changed[1]; }
void ResetTexMatrixBChange(); void ResetTexMatrixBChange();
bool DidPosNormalChange() const { return m_pos_normal_matrix_changed; }
void ResetPosNormalChange();
void SetProjectionChanged(); void SetProjectionChanged();
bool DidProjectionChange() const { return m_projection_changed; } bool DidProjectionChange() const { return m_projection_changed; }
void ResetProjection(); void ResetProjection();
@ -74,7 +71,6 @@ public:
private: private:
// track changes // track changes
std::array<bool, 2> m_tex_matrices_changed{}; std::array<bool, 2> m_tex_matrices_changed{};
bool m_pos_normal_matrix_changed = false;
bool m_projection_changed = false; bool m_projection_changed = false;
bool m_viewport_changed = false; bool m_viewport_changed = false;
bool m_tex_mtx_info_changed = false; bool m_tex_mtx_info_changed = false;