Merge pull request #10864 from TellowKrinkle/BetterLogicBlend
VideoCommon: Better logic op invert approximation
This commit is contained in:
commit
0f037a1af8
|
@ -744,6 +744,7 @@ static void WriteAlphaTest(ShaderCode& out, const pixel_shader_uid_data* uid_dat
|
||||||
bool per_pixel_depth, bool use_dual_source);
|
bool per_pixel_depth, bool use_dual_source);
|
||||||
static void WriteFog(ShaderCode& out, const pixel_shader_uid_data* uid_data);
|
static void WriteFog(ShaderCode& out, const pixel_shader_uid_data* uid_data);
|
||||||
static void WriteLogicOp(ShaderCode& out, const pixel_shader_uid_data* uid_data);
|
static void WriteLogicOp(ShaderCode& out, const pixel_shader_uid_data* uid_data);
|
||||||
|
static void WriteLogicOpBlend(ShaderCode& out, const pixel_shader_uid_data* uid_data);
|
||||||
static void WriteColor(ShaderCode& out, APIType api_type, const pixel_shader_uid_data* uid_data,
|
static void WriteColor(ShaderCode& out, APIType api_type, const pixel_shader_uid_data* uid_data,
|
||||||
bool use_dual_source);
|
bool use_dual_source);
|
||||||
static void WriteBlend(ShaderCode& out, const pixel_shader_uid_data* uid_data);
|
static void WriteBlend(ShaderCode& out, const pixel_shader_uid_data* uid_data);
|
||||||
|
@ -1148,6 +1149,8 @@ ShaderCode GeneratePixelShaderCode(APIType api_type, const ShaderHostConfig& hos
|
||||||
|
|
||||||
if (uid_data->logic_op_enable)
|
if (uid_data->logic_op_enable)
|
||||||
WriteLogicOp(out, uid_data);
|
WriteLogicOp(out, uid_data);
|
||||||
|
else if (uid_data->emulate_logic_op_with_blend)
|
||||||
|
WriteLogicOpBlend(out, uid_data);
|
||||||
|
|
||||||
// Write the color and alpha values to the framebuffer
|
// Write the color and alpha values to the framebuffer
|
||||||
// If using shader blend, we still use the separate alpha
|
// If using shader blend, we still use the separate alpha
|
||||||
|
@ -1803,6 +1806,29 @@ static void WriteLogicOp(ShaderCode& out, const pixel_shader_uid_data* uid_data)
|
||||||
out.Write("\tprev = ({}) & 0xff;\n", logic_op_mode[uid_data->logic_op_mode]);
|
out.Write("\tprev = ({}) & 0xff;\n", logic_op_mode[uid_data->logic_op_mode]);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static void WriteLogicOpBlend(ShaderCode& out, const pixel_shader_uid_data* uid_data)
|
||||||
|
{
|
||||||
|
switch (static_cast<LogicOp>(uid_data->logic_op_mode))
|
||||||
|
{
|
||||||
|
case LogicOp::Clear:
|
||||||
|
case LogicOp::NoOp:
|
||||||
|
out.Write("\tprev = int4(0, 0, 0, 0);\n");
|
||||||
|
break;
|
||||||
|
case LogicOp::Copy:
|
||||||
|
// Do nothing!
|
||||||
|
break;
|
||||||
|
case LogicOp::CopyInverted:
|
||||||
|
out.Write("\tprev ^= 255;\n");
|
||||||
|
break;
|
||||||
|
case LogicOp::Set:
|
||||||
|
case LogicOp::Invert: // In cooperation with blend
|
||||||
|
out.Write("\tprev = int4(255, 255, 255, 255);\n");
|
||||||
|
break;
|
||||||
|
default:
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
static void WriteColor(ShaderCode& out, APIType api_type, const pixel_shader_uid_data* uid_data,
|
static void WriteColor(ShaderCode& out, APIType api_type, const pixel_shader_uid_data* uid_data,
|
||||||
bool use_dual_source)
|
bool use_dual_source)
|
||||||
{
|
{
|
||||||
|
|
|
@ -58,8 +58,9 @@ struct pixel_shader_uid_data
|
||||||
DstBlendFactor blend_dst_factor_alpha : 3; // Only used with shader_framebuffer_fetch blend
|
DstBlendFactor blend_dst_factor_alpha : 3; // Only used with shader_framebuffer_fetch blend
|
||||||
u32 blend_subtract : 1; // Only used with shader_framebuffer_fetch blend
|
u32 blend_subtract : 1; // Only used with shader_framebuffer_fetch blend
|
||||||
u32 blend_subtract_alpha : 1; // Only used with shader_framebuffer_fetch blend
|
u32 blend_subtract_alpha : 1; // Only used with shader_framebuffer_fetch blend
|
||||||
|
u32 emulate_logic_op_with_blend : 1; // Only used with logic op blend emulation
|
||||||
u32 logic_op_enable : 1; // Only used with shader_framebuffer_fetch logic ops
|
u32 logic_op_enable : 1; // Only used with shader_framebuffer_fetch logic ops
|
||||||
u32 logic_op_mode : 4; // Only used with shader_framebuffer_fetch logic ops
|
u32 logic_op_mode : 4; // Only used with shader_framebuffer_fetch logic ops and blend emulation
|
||||||
|
|
||||||
u32 texMtxInfo_n_projection : 8; // 8x1 bit
|
u32 texMtxInfo_n_projection : 8; // 8x1 bit
|
||||||
u32 tevindref_bi0 : 3;
|
u32 tevindref_bi0 : 3;
|
||||||
|
|
|
@ -185,6 +185,7 @@ void BlendingState::ApproximateLogicOpWithBlending()
|
||||||
{
|
{
|
||||||
struct LogicOpApproximation
|
struct LogicOpApproximation
|
||||||
{
|
{
|
||||||
|
bool blendEnable;
|
||||||
bool subtract;
|
bool subtract;
|
||||||
SrcBlendFactor srcfactor;
|
SrcBlendFactor srcfactor;
|
||||||
DstBlendFactor dstfactor;
|
DstBlendFactor dstfactor;
|
||||||
|
@ -193,31 +194,69 @@ void BlendingState::ApproximateLogicOpWithBlending()
|
||||||
// but INVSRCCLR and INVDSTCLR were also aliased and were mixed.
|
// but INVSRCCLR and INVDSTCLR were also aliased and were mixed.
|
||||||
// Thus, NOR, EQUIV, INVERT, COPY_INVERTED, and OR_INVERTED duplicate(d) other values.
|
// Thus, NOR, EQUIV, INVERT, COPY_INVERTED, and OR_INVERTED duplicate(d) other values.
|
||||||
static constexpr std::array<LogicOpApproximation, 16> approximations = {{
|
static constexpr std::array<LogicOpApproximation, 16> approximations = {{
|
||||||
{false, SrcBlendFactor::Zero, DstBlendFactor::Zero}, // CLEAR
|
// clang-format off
|
||||||
{false, SrcBlendFactor::DstClr, DstBlendFactor::Zero}, // AND
|
{false, false, SrcBlendFactor::One, DstBlendFactor::Zero}, // CLEAR (Shader outputs 0)
|
||||||
{true, SrcBlendFactor::One, DstBlendFactor::InvSrcClr}, // AND_REVERSE
|
{true, false, SrcBlendFactor::DstClr, DstBlendFactor::Zero}, // AND
|
||||||
{false, SrcBlendFactor::One, DstBlendFactor::Zero}, // COPY
|
{true, true, SrcBlendFactor::One, DstBlendFactor::InvSrcClr}, // AND_REVERSE
|
||||||
{true, SrcBlendFactor::DstClr, DstBlendFactor::One}, // AND_INVERTED
|
{false, false, SrcBlendFactor::One, DstBlendFactor::Zero}, // COPY
|
||||||
{false, SrcBlendFactor::Zero, DstBlendFactor::One}, // NOOP
|
{true, true, SrcBlendFactor::DstClr, DstBlendFactor::One}, // AND_INVERTED
|
||||||
{false, SrcBlendFactor::InvDstClr, DstBlendFactor::InvSrcClr}, // XOR
|
{true, false, SrcBlendFactor::Zero, DstBlendFactor::One}, // NOOP
|
||||||
{false, SrcBlendFactor::InvDstClr, DstBlendFactor::One}, // OR
|
{true, false, SrcBlendFactor::InvDstClr, DstBlendFactor::InvSrcClr}, // XOR
|
||||||
{false, SrcBlendFactor::InvDstClr, DstBlendFactor::InvSrcClr}, // NOR
|
{true, false, SrcBlendFactor::InvDstClr, DstBlendFactor::One}, // OR
|
||||||
{false, SrcBlendFactor::InvDstClr, DstBlendFactor::Zero}, // EQUIV
|
{true, false, SrcBlendFactor::InvDstClr, DstBlendFactor::InvSrcClr}, // NOR
|
||||||
{false, SrcBlendFactor::InvDstClr, DstBlendFactor::InvSrcClr}, // INVERT
|
{true, false, SrcBlendFactor::InvDstClr, DstBlendFactor::Zero}, // EQUIV
|
||||||
{false, SrcBlendFactor::One, DstBlendFactor::InvDstAlpha}, // OR_REVERSE
|
{true, false, SrcBlendFactor::InvDstClr, DstBlendFactor::Zero}, // INVERT (Shader outputs 255)
|
||||||
{false, SrcBlendFactor::InvDstClr, DstBlendFactor::InvSrcClr}, // COPY_INVERTED
|
{true, false, SrcBlendFactor::One, DstBlendFactor::InvDstAlpha}, // OR_REVERSE
|
||||||
{false, SrcBlendFactor::InvDstClr, DstBlendFactor::One}, // OR_INVERTED
|
{false, false, SrcBlendFactor::One, DstBlendFactor::Zero}, // COPY_INVERTED (Shader inverts)
|
||||||
{false, SrcBlendFactor::InvDstClr, DstBlendFactor::InvSrcClr}, // NAND
|
{true, false, SrcBlendFactor::InvDstClr, DstBlendFactor::One}, // OR_INVERTED
|
||||||
{false, SrcBlendFactor::One, DstBlendFactor::One}, // SET
|
{true, false, SrcBlendFactor::InvDstClr, DstBlendFactor::InvSrcClr}, // NAND
|
||||||
|
{false, false, SrcBlendFactor::One, DstBlendFactor::Zero}, // SET (Shader outputs 255)
|
||||||
|
// clang-format on
|
||||||
}};
|
}};
|
||||||
|
|
||||||
logicopenable = false;
|
logicopenable = false;
|
||||||
blendenable = true;
|
usedualsrc = false;
|
||||||
subtract = approximations[u32(logicmode.Value())].subtract;
|
const LogicOpApproximation& approximation = approximations[static_cast<u32>(logicmode.Value())];
|
||||||
srcfactor = approximations[u32(logicmode.Value())].srcfactor;
|
if (approximation.blendEnable)
|
||||||
srcfactoralpha = approximations[u32(logicmode.Value())].srcfactor;
|
{
|
||||||
dstfactor = approximations[u32(logicmode.Value())].dstfactor;
|
blendenable = true;
|
||||||
dstfactoralpha = approximations[u32(logicmode.Value())].dstfactor;
|
subtract = approximation.subtract;
|
||||||
|
srcfactor = approximation.srcfactor;
|
||||||
|
srcfactoralpha = approximation.srcfactor;
|
||||||
|
dstfactor = approximation.dstfactor;
|
||||||
|
dstfactoralpha = approximation.dstfactor;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
bool BlendingState::LogicOpApproximationIsExact()
|
||||||
|
{
|
||||||
|
switch (logicmode.Value())
|
||||||
|
{
|
||||||
|
case LogicOp::Clear:
|
||||||
|
case LogicOp::Set:
|
||||||
|
case LogicOp::NoOp:
|
||||||
|
case LogicOp::Invert:
|
||||||
|
case LogicOp::CopyInverted:
|
||||||
|
case LogicOp::Copy:
|
||||||
|
return true;
|
||||||
|
default:
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
bool BlendingState::LogicOpApproximationWantsShaderHelp()
|
||||||
|
{
|
||||||
|
switch (logicmode.Value())
|
||||||
|
{
|
||||||
|
case LogicOp::Clear:
|
||||||
|
case LogicOp::Set:
|
||||||
|
case LogicOp::NoOp:
|
||||||
|
case LogicOp::Invert:
|
||||||
|
case LogicOp::CopyInverted:
|
||||||
|
return true;
|
||||||
|
default:
|
||||||
|
return false;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void SamplerState::Generate(const BPMemory& bp, u32 index)
|
void SamplerState::Generate(const BPMemory& bp, u32 index)
|
||||||
|
|
|
@ -109,6 +109,8 @@ union BlendingState
|
||||||
// HACK: Replaces logical operations with blend operations.
|
// HACK: Replaces logical operations with blend operations.
|
||||||
// Will not be bit-correct, and in some cases not even remotely in the same ballpark.
|
// Will not be bit-correct, and in some cases not even remotely in the same ballpark.
|
||||||
void ApproximateLogicOpWithBlending();
|
void ApproximateLogicOpWithBlending();
|
||||||
|
bool LogicOpApproximationIsExact();
|
||||||
|
bool LogicOpApproximationWantsShaderHelp();
|
||||||
|
|
||||||
BlendingState() = default;
|
BlendingState() = default;
|
||||||
BlendingState(const BlendingState&) = default;
|
BlendingState(const BlendingState&) = default;
|
||||||
|
|
|
@ -601,16 +601,6 @@ AbstractPipelineConfig ShaderCache::GetGXPipelineConfig(
|
||||||
config.depth_state = depth_state;
|
config.depth_state = depth_state;
|
||||||
config.blending_state = blending_state;
|
config.blending_state = blending_state;
|
||||||
config.framebuffer_state = g_framebuffer_manager->GetEFBFramebufferState();
|
config.framebuffer_state = g_framebuffer_manager->GetEFBFramebufferState();
|
||||||
|
|
||||||
// We can use framebuffer fetch to emulate logic ops in the fragment shader.
|
|
||||||
if (config.blending_state.logicopenable && !g_ActiveConfig.backend_info.bSupportsLogicOp &&
|
|
||||||
!g_ActiveConfig.backend_info.bSupportsFramebufferFetch)
|
|
||||||
{
|
|
||||||
WARN_LOG_FMT(VIDEO,
|
|
||||||
"Approximating logic op with blending, this will produce incorrect rendering.");
|
|
||||||
config.blending_state.ApproximateLogicOpWithBlending();
|
|
||||||
}
|
|
||||||
|
|
||||||
return config;
|
return config;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -628,6 +618,22 @@ static GXPipelineUid ApplyDriverBugs(const GXPipelineUid& in)
|
||||||
ps->ztest = EmulatedZ::Early;
|
ps->ztest = EmulatedZ::Early;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// If framebuffer fetch is available, we can emulate logic ops in the fragment shader
|
||||||
|
// and don't need the below blend approximation
|
||||||
|
if (blend.logicopenable && !g_ActiveConfig.backend_info.bSupportsLogicOp &&
|
||||||
|
!g_ActiveConfig.backend_info.bSupportsFramebufferFetch)
|
||||||
|
{
|
||||||
|
if (!blend.LogicOpApproximationIsExact())
|
||||||
|
WARN_LOG_FMT(VIDEO,
|
||||||
|
"Approximating logic op with blending, this will produce incorrect rendering.");
|
||||||
|
if (blend.LogicOpApproximationWantsShaderHelp())
|
||||||
|
{
|
||||||
|
ps->emulate_logic_op_with_blend = true;
|
||||||
|
ps->logic_op_mode = static_cast<u32>(blend.logicmode.Value());
|
||||||
|
}
|
||||||
|
blend.ApproximateLogicOpWithBlending();
|
||||||
|
}
|
||||||
|
|
||||||
const bool benefits_from_ps_dual_source_off =
|
const bool benefits_from_ps_dual_source_off =
|
||||||
(!g_ActiveConfig.backend_info.bSupportsDualSourceBlend &&
|
(!g_ActiveConfig.backend_info.bSupportsDualSourceBlend &&
|
||||||
g_ActiveConfig.backend_info.bSupportsFramebufferFetch) ||
|
g_ActiveConfig.backend_info.bSupportsFramebufferFetch) ||
|
||||||
|
@ -775,6 +781,18 @@ static GXUberPipelineUid ApplyDriverBugs(const GXUberPipelineUid& in)
|
||||||
memcpy(&out, &in, sizeof(out)); // Copy padding
|
memcpy(&out, &in, sizeof(out)); // Copy padding
|
||||||
if (g_ActiveConfig.backend_info.bSupportsDynamicVertexLoader)
|
if (g_ActiveConfig.backend_info.bSupportsDynamicVertexLoader)
|
||||||
out.vertex_format = nullptr;
|
out.vertex_format = nullptr;
|
||||||
|
|
||||||
|
// If framebuffer fetch is available, we can emulate logic ops in the fragment shader
|
||||||
|
// and don't need the below blend approximation
|
||||||
|
if (out.blending_state.logicopenable && !g_ActiveConfig.backend_info.bSupportsLogicOp &&
|
||||||
|
!g_ActiveConfig.backend_info.bSupportsFramebufferFetch)
|
||||||
|
{
|
||||||
|
if (!out.blending_state.LogicOpApproximationIsExact())
|
||||||
|
WARN_LOG_FMT(VIDEO,
|
||||||
|
"Approximating logic op with blending, this will produce incorrect rendering.");
|
||||||
|
out.blending_state.ApproximateLogicOpWithBlending();
|
||||||
|
}
|
||||||
|
|
||||||
if (g_ActiveConfig.backend_info.bSupportsFramebufferFetch)
|
if (g_ActiveConfig.backend_info.bSupportsFramebufferFetch)
|
||||||
{
|
{
|
||||||
// Always blend in shader
|
// Always blend in shader
|
||||||
|
|
|
@ -1092,6 +1092,26 @@ ShaderCode GenPixelShader(APIType api_type, const ShaderHostConfig& host_config,
|
||||||
" TevResult &= 0xff;\n"
|
" TevResult &= 0xff;\n"
|
||||||
" }}\n");
|
" }}\n");
|
||||||
}
|
}
|
||||||
|
else if (!host_config.backend_logic_op)
|
||||||
|
{
|
||||||
|
out.Write(" // Helpers for logic op blending approximations\n"
|
||||||
|
" if (logic_op_enable) {{\n"
|
||||||
|
" switch (logic_op_mode) {{\n");
|
||||||
|
out.Write(" case {}: // Clear\n", static_cast<u32>(LogicOp::Clear));
|
||||||
|
out.Write(" TevResult = int4(0, 0, 0, 0);\n"
|
||||||
|
" break;\n");
|
||||||
|
out.Write(" case {}: // Copy Inverted\n", static_cast<u32>(LogicOp::CopyInverted));
|
||||||
|
out.Write(" TevResult ^= 0xff;\n"
|
||||||
|
" break;\n");
|
||||||
|
out.Write(" case {}: // Set\n", static_cast<u32>(LogicOp::Set));
|
||||||
|
out.Write(" case {}: // Invert\n", static_cast<u32>(LogicOp::Invert));
|
||||||
|
out.Write(" TevResult = int4(255, 255, 255, 255);\n"
|
||||||
|
" break;\n");
|
||||||
|
out.Write(" default:\n"
|
||||||
|
" break;\n"
|
||||||
|
" }}\n"
|
||||||
|
" }}\n");
|
||||||
|
}
|
||||||
|
|
||||||
// Some backends require that the shader outputs be uint when writing to a uint render target for
|
// Some backends require that the shader outputs be uint when writing to a uint render target for
|
||||||
// logic op.
|
// logic op.
|
||||||
|
|
Loading…
Reference in New Issue