VideoCommon: Handle custom texture sizes correctly
Specifically, when using Manual Texture Sampling, if textures sizes don't match the size the game specifies, things previously broke. That can happen with custom textures, and also with scaled EFB copies at non-native IRs. It breaks most obviously by not scaling the texture coordinates (so only part of the texture shows up), but the hardware wrapping functionality also assumes texture sizes are a power of 2 (or else it will behave weirdly in a way that matches how hardware behaves weirdly). The fix is to provide alternative texture wrapping logic when custom texture sizes are possible.
This commit is contained in:
parent
93eea7cb13
commit
bdcfb31187
|
@ -568,6 +568,43 @@ int4 readTextureLinear(in Texture2DArray tex, uint2 uv1, uint2 uv2, int layer, i
|
||||||
}}
|
}}
|
||||||
)");
|
)");
|
||||||
|
|
||||||
|
if (host_config.manual_texture_sampling_custom_texture_sizes)
|
||||||
|
{
|
||||||
|
// This is slower, and doesn't result in the same odd behavior that happens on console when
|
||||||
|
// wrapping with non-power-of-2 sizes, but it's fine for custom textures to have non-console
|
||||||
|
// behavior.
|
||||||
|
out.Write(R"(
|
||||||
|
// Both GLSL and HLSL produce undefined values when the modulo operator (%) is used with a negative
|
||||||
|
// dividend and a positive divisor. We want a positive value such that SafeModulo(-1, 3) is 2.
|
||||||
|
int SafeModulo(int dividend, int divisor) {{
|
||||||
|
if (dividend >= 0) {{
|
||||||
|
return dividend % divisor;
|
||||||
|
}} else {{
|
||||||
|
// This works because ~x is the same as -x - 1.
|
||||||
|
// `~x % 5` over -5 to -1 gives 4, 3, 2, 1, 0. `4 - (~x % 5)` gives 0, 1, 2, 3, 4.
|
||||||
|
return (divisor - 1) - (~dividend % divisor);
|
||||||
|
}}
|
||||||
|
}}
|
||||||
|
|
||||||
|
uint WrapCoord(int coord, uint wrap, int size) {{
|
||||||
|
switch (wrap) {{
|
||||||
|
case {:s}:
|
||||||
|
default: // confirmed that clamp is used for invalid (3) via hardware test
|
||||||
|
return uint(clamp(coord, 0, size - 1));
|
||||||
|
case {:s}:
|
||||||
|
return uint(SafeModulo(coord, size)); // coord % size
|
||||||
|
case {:s}:
|
||||||
|
if (SafeModulo(coord, 2 * size) >= size) {{ // coord % (2 * size)
|
||||||
|
coord = ~coord;
|
||||||
|
}}
|
||||||
|
return uint(SafeModulo(coord, size)); // coord % size
|
||||||
|
}}
|
||||||
|
}}
|
||||||
|
)",
|
||||||
|
WrapMode::Clamp, WrapMode::Repeat, WrapMode::Mirror);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
out.Write(R"(
|
out.Write(R"(
|
||||||
uint WrapCoord(int coord, uint wrap, int size) {{
|
uint WrapCoord(int coord, uint wrap, int size) {{
|
||||||
switch (wrap) {{
|
switch (wrap) {{
|
||||||
|
@ -586,6 +623,7 @@ uint WrapCoord(int coord, uint wrap, int size) {{
|
||||||
)",
|
)",
|
||||||
WrapMode::Clamp, WrapMode::Repeat, WrapMode::Mirror);
|
WrapMode::Clamp, WrapMode::Repeat, WrapMode::Mirror);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
if (api_type == APIType::OpenGL || api_type == APIType::Vulkan)
|
if (api_type == APIType::OpenGL || api_type == APIType::Vulkan)
|
||||||
{
|
{
|
||||||
|
@ -616,8 +654,6 @@ uint WrapCoord(int coord, uint wrap, int size) {{
|
||||||
out.Write(R"(
|
out.Write(R"(
|
||||||
uint texmode0 = samp_texmode0(texmap);
|
uint texmode0 = samp_texmode0(texmap);
|
||||||
uint texmode1 = samp_texmode1(texmap);
|
uint texmode1 = samp_texmode1(texmap);
|
||||||
int size_s = )" I_TEXDIMS R"([texmap].x;
|
|
||||||
int size_t = )" I_TEXDIMS R"([texmap].y;
|
|
||||||
|
|
||||||
uint wrap_s = {};
|
uint wrap_s = {};
|
||||||
uint wrap_t = {};
|
uint wrap_t = {};
|
||||||
|
@ -643,6 +679,46 @@ uint WrapCoord(int coord, uint wrap, int size) {{
|
||||||
BitfieldExtract<&SamplerState::TM1::min_lod>("texmode1"),
|
BitfieldExtract<&SamplerState::TM1::min_lod>("texmode1"),
|
||||||
BitfieldExtract<&SamplerState::TM1::max_lod>("texmode1"));
|
BitfieldExtract<&SamplerState::TM1::max_lod>("texmode1"));
|
||||||
|
|
||||||
|
if (host_config.manual_texture_sampling_custom_texture_sizes)
|
||||||
|
{
|
||||||
|
out.Write(R"(
|
||||||
|
int native_size_s = )" I_TEXDIMS R"([texmap].x;
|
||||||
|
int native_size_t = )" I_TEXDIMS R"([texmap].y;
|
||||||
|
)");
|
||||||
|
|
||||||
|
if (api_type == APIType::OpenGL || api_type == APIType::Vulkan)
|
||||||
|
{
|
||||||
|
out.Write(R"(
|
||||||
|
int3 size = textureSize(tex, 0);
|
||||||
|
int size_s = size.x;
|
||||||
|
int size_t = size.y;
|
||||||
|
int number_of_levels = textureQueryLevels(tex);
|
||||||
|
)");
|
||||||
|
}
|
||||||
|
else if (api_type == APIType::D3D)
|
||||||
|
{
|
||||||
|
out.Write(R"(
|
||||||
|
int size_s, size_t, layers, number_of_levels;
|
||||||
|
tex.GetDimensions(0, size_s, size_t, layers, number_of_levels);
|
||||||
|
)");
|
||||||
|
}
|
||||||
|
|
||||||
|
out.Write(R"(
|
||||||
|
// Prevent out-of-bounds LOD values when using custom textures
|
||||||
|
max_lod = min(max_lod, (number_of_levels - 1) << 4);
|
||||||
|
// Rescale uv to account for the new texture size
|
||||||
|
uv.x = (uv.x * size_s) / native_size_s;
|
||||||
|
uv.y = (uv.y * size_t) / native_size_t;
|
||||||
|
)");
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
out.Write(R"(
|
||||||
|
int size_s = )" I_TEXDIMS R"([texmap].x;
|
||||||
|
int size_t = )" I_TEXDIMS R"([texmap].y;
|
||||||
|
)");
|
||||||
|
}
|
||||||
|
|
||||||
if (api_type == APIType::OpenGL || api_type == APIType::Vulkan)
|
if (api_type == APIType::OpenGL || api_type == APIType::Vulkan)
|
||||||
{
|
{
|
||||||
if (g_ActiveConfig.backend_info.bSupportsCoarseDerivatives)
|
if (g_ActiveConfig.backend_info.bSupportsCoarseDerivatives)
|
||||||
|
|
|
@ -40,6 +40,8 @@ ShaderHostConfig ShaderHostConfig::GetCurrent()
|
||||||
bits.backend_palette_conversion = g_ActiveConfig.backend_info.bSupportsPaletteConversion;
|
bits.backend_palette_conversion = g_ActiveConfig.backend_info.bSupportsPaletteConversion;
|
||||||
bits.enable_validation_layer = g_ActiveConfig.bEnableValidationLayer;
|
bits.enable_validation_layer = g_ActiveConfig.bEnableValidationLayer;
|
||||||
bits.manual_texture_sampling = !g_ActiveConfig.bFastTextureSampling;
|
bits.manual_texture_sampling = !g_ActiveConfig.bFastTextureSampling;
|
||||||
|
bits.manual_texture_sampling_custom_texture_sizes =
|
||||||
|
g_ActiveConfig.ManualTextureSamplingWithHiResTextures();
|
||||||
return bits;
|
return bits;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -170,6 +170,7 @@ union ShaderHostConfig
|
||||||
BitField<22, 1, bool, u32> backend_palette_conversion;
|
BitField<22, 1, bool, u32> backend_palette_conversion;
|
||||||
BitField<23, 1, bool, u32> enable_validation_layer;
|
BitField<23, 1, bool, u32> enable_validation_layer;
|
||||||
BitField<24, 1, bool, u32> manual_texture_sampling;
|
BitField<24, 1, bool, u32> manual_texture_sampling;
|
||||||
|
BitField<25, 1, bool, u32> manual_texture_sampling_custom_texture_sizes;
|
||||||
|
|
||||||
static ShaderHostConfig GetCurrent();
|
static ShaderHostConfig GetCurrent();
|
||||||
};
|
};
|
||||||
|
|
|
@ -245,6 +245,16 @@ struct VideoConfig final
|
||||||
return backend_info.bSupportsGPUTextureDecoding && bEnableGPUTextureDecoding;
|
return backend_info.bSupportsGPUTextureDecoding && bEnableGPUTextureDecoding;
|
||||||
}
|
}
|
||||||
bool UseVertexRounding() const { return bVertexRounding && iEFBScale != 1; }
|
bool UseVertexRounding() const { return bVertexRounding && iEFBScale != 1; }
|
||||||
|
bool ManualTextureSamplingWithHiResTextures() const
|
||||||
|
{
|
||||||
|
// Hi-res textures (including hi-res EFB copies, but not native-resolution EFB copies at higher
|
||||||
|
// internal resolutions) breaks the wrapping logic used by manual texture sampling.
|
||||||
|
if (bFastTextureSampling)
|
||||||
|
return false;
|
||||||
|
if (iEFBScale != 1 && bCopyEFBScaled)
|
||||||
|
return true;
|
||||||
|
return bHiresTextures;
|
||||||
|
}
|
||||||
bool UsingUberShaders() const;
|
bool UsingUberShaders() const;
|
||||||
u32 GetShaderCompilerThreads() const;
|
u32 GetShaderCompilerThreads() const;
|
||||||
u32 GetShaderPrecompilerThreads() const;
|
u32 GetShaderPrecompilerThreads() const;
|
||||||
|
|
Loading…
Reference in New Issue