[D3D12] Convert GlslShaderTranslator flow control to HLSL
This commit is contained in:
parent
7afc40820b
commit
d60c8b29ca
|
@ -26,11 +26,20 @@ HlslShaderTranslator::~HlslShaderTranslator() = default;
|
||||||
|
|
||||||
void HlslShaderTranslator::Reset() {
|
void HlslShaderTranslator::Reset() {
|
||||||
ShaderTranslator::Reset();
|
ShaderTranslator::Reset();
|
||||||
|
|
||||||
|
source_.Reset();
|
||||||
depth_ = 0;
|
depth_ = 0;
|
||||||
depth_prefix[0] = 0;
|
depth_prefix[0] = 0;
|
||||||
source_.Reset();
|
|
||||||
|
cf_wrote_pc_ = false;
|
||||||
|
cf_exec_pred_ = false;
|
||||||
|
cf_exec_pred_cond_ = false;
|
||||||
|
|
||||||
srv_bindings_.clear();
|
srv_bindings_.clear();
|
||||||
|
|
||||||
sampler_count_ = 0;
|
sampler_count_ = 0;
|
||||||
|
|
||||||
|
cube_used_ = false;
|
||||||
}
|
}
|
||||||
|
|
||||||
void HlslShaderTranslator::EmitTranslationError(const char* message) {
|
void HlslShaderTranslator::EmitTranslationError(const char* message) {
|
||||||
|
@ -134,7 +143,13 @@ void HlslShaderTranslator::StartTranslation() {
|
||||||
"XePixelShaderOutput main(XePixelShaderInput xe_input) {\n"
|
"XePixelShaderOutput main(XePixelShaderInput xe_input) {\n"
|
||||||
" float4 xe_r[%u];\n"
|
" float4 xe_r[%u];\n"
|
||||||
" XePixelShaderOutput xe_output;\n",
|
" XePixelShaderOutput xe_output;\n",
|
||||||
kMaxInterpolators, std::max(register_count(), kMaxInterpolators));
|
kMaxInterpolators, register_count());
|
||||||
|
// Copy interpolators to the first registers.
|
||||||
|
uint32_t interpolator_register_count =
|
||||||
|
std::min(register_count(), kMaxInterpolators);
|
||||||
|
for (uint32_t i = 0; i < interpolator_register_count; ++i) {
|
||||||
|
EmitSource(" xe_r[%u] = xe_input.interpolators[%u];\n", i, i);
|
||||||
|
}
|
||||||
// No need to write zero to every output because in case an output is
|
// No need to write zero to every output because in case an output is
|
||||||
// completely unused, writing to that render target will be disabled in the
|
// completely unused, writing to that render target will be disabled in the
|
||||||
// blending state (in Halo 3, one important render target is destroyed by a
|
// blending state (in Halo 3, one important render target is destroyed by a
|
||||||
|
@ -143,7 +158,13 @@ void HlslShaderTranslator::StartTranslation() {
|
||||||
}
|
}
|
||||||
|
|
||||||
EmitSource(
|
EmitSource(
|
||||||
// Predicate temp, clause-local.
|
// Float constant index for dynamic indexing.
|
||||||
|
" uint xe_float_constant_index;\n"
|
||||||
|
// Previous vector result (used as a scratch).
|
||||||
|
" float4 xe_pv;\n"
|
||||||
|
// Previous scalar result (used for RETAIN_PREV).
|
||||||
|
" float xe_ps;\n"
|
||||||
|
// Predicate temp, clause-local. Initially false like cf_exec_pred_cond_.
|
||||||
" bool xe_p0 = false;\n"
|
" bool xe_p0 = false;\n"
|
||||||
// Address register when using absolute addressing.
|
// Address register when using absolute addressing.
|
||||||
" int xe_a0 = 0;\n"
|
" int xe_a0 = 0;\n"
|
||||||
|
@ -151,11 +172,7 @@ void HlslShaderTranslator::StartTranslation() {
|
||||||
" int4 xe_aL = int4(0, 0, 0, 0);\n"
|
" int4 xe_aL = int4(0, 0, 0, 0);\n"
|
||||||
// Loop counter stack, .x is the active loop.
|
// Loop counter stack, .x is the active loop.
|
||||||
// Represents number of times remaining to loop.
|
// Represents number of times remaining to loop.
|
||||||
" int4 xe_loop_count = int4(0, 0, 0, 0);\n"
|
" uint4 xe_loop_count = uint4(0u, 0u, 0u, 0u);\n"
|
||||||
// Previous vector result (used as a scratch).
|
|
||||||
" float4 xe_pv;\n"
|
|
||||||
// Previous scalar result (used for RETAIN_PREV).
|
|
||||||
" float xe_ps;\n"
|
|
||||||
// Master loop and switch for flow control.
|
// Master loop and switch for flow control.
|
||||||
" uint xe_pc = 0u;\n"
|
" uint xe_pc = 0u;\n"
|
||||||
"\n"
|
"\n"
|
||||||
|
@ -169,6 +186,194 @@ void HlslShaderTranslator::StartTranslation() {
|
||||||
Indent();
|
Indent();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessLabel(uint32_t cf_index) {
|
||||||
|
// 0 is always added in the beginning.
|
||||||
|
if (cf_index != 0) {
|
||||||
|
EmitSourceDepth("case %u:\n", cf_index);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessControlFlowNopInstruction(uint32_t cf_index) {
|
||||||
|
EmitSourceDepth("// cnop\n");
|
||||||
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessControlFlowInstructionBegin(
|
||||||
|
uint32_t cf_index) {
|
||||||
|
cf_wrote_pc_ = false;
|
||||||
|
Indent();
|
||||||
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessControlFlowInstructionEnd(uint32_t cf_index) {
|
||||||
|
if (!cf_wrote_pc_) {
|
||||||
|
EmitSourceDepth("// Falling through to L%u\n", cf_index + 1);
|
||||||
|
}
|
||||||
|
Unindent();
|
||||||
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessExecInstructionBegin(
|
||||||
|
const ParsedExecInstruction& instr) {
|
||||||
|
EmitSourceDepth("// ");
|
||||||
|
instr.Disassemble(&source_);
|
||||||
|
|
||||||
|
cf_exec_pred_ = false;
|
||||||
|
switch (instr.type) {
|
||||||
|
case ParsedExecInstruction::Type::kUnconditional:
|
||||||
|
EmitSourceDepth("{\n");
|
||||||
|
break;
|
||||||
|
case ParsedExecInstruction::Type::kConditional:
|
||||||
|
EmitSourceDepth("if ((xe_bool_constants[%u] & (1u << %uu)) %c= 0u) {\n",
|
||||||
|
instr.bool_constant_index >> 5,
|
||||||
|
instr.bool_constant_index & 31,
|
||||||
|
instr.condition ? '!' : '=');
|
||||||
|
break;
|
||||||
|
case ParsedExecInstruction::Type::kPredicated:
|
||||||
|
cf_exec_pred_ = true;
|
||||||
|
cf_exec_pred_cond_ = instr.condition;
|
||||||
|
EmitSourceDepth("if (%cxe_p0) {\n", instr.condition ? ' ' : '!');
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
Indent();
|
||||||
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessExecInstructionEnd(
|
||||||
|
const ParsedExecInstruction& instr) {
|
||||||
|
if (instr.is_end) {
|
||||||
|
EmitSourceDepth("xe_pc = 0xFFFFu;\n");
|
||||||
|
EmitSourceDepth("break;\n");
|
||||||
|
cf_wrote_pc_ = true;
|
||||||
|
}
|
||||||
|
Unindent();
|
||||||
|
EmitSourceDepth("}\n");
|
||||||
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessLoopStartInstruction(
|
||||||
|
const ParsedLoopStartInstruction& instr) {
|
||||||
|
EmitSourceDepth("// ");
|
||||||
|
instr.Disassemble(&source_);
|
||||||
|
|
||||||
|
// Setup counter.
|
||||||
|
EmitSourceDepth("xe_loop_count.yzw = xe_loop_count.xyz;\n");
|
||||||
|
EmitSourceDepth("xe_loop_count.x = xe_loop_constants[%u] & 0xFFu;\n");
|
||||||
|
|
||||||
|
// Setup relative indexing.
|
||||||
|
EmitSourceDepth("xe_aL = xe_aL.xxyz;\n");
|
||||||
|
if (!instr.is_repeat) {
|
||||||
|
// Push new loop starting index if not reusing the current one.
|
||||||
|
EmitSourceDepth("xe_aL.x = int((xe_loop_constants[%u] >> 8u) & 0xFFu);\n");
|
||||||
|
}
|
||||||
|
|
||||||
|
// Quick skip loop if zero count.
|
||||||
|
EmitSourceDepth("if (xe_loop_count.x == 0u) {\n");
|
||||||
|
EmitSourceDepth(" xe_pc = %u; // Skip loop to L%u\n",
|
||||||
|
instr.loop_skip_address, instr.loop_skip_address);
|
||||||
|
EmitSourceDepth("} else {\n");
|
||||||
|
EmitSourceDepth(" xe_pc = %u; // Fallthrough to loop body L%u\n",
|
||||||
|
instr.dword_index + 1, instr.dword_index + 1);
|
||||||
|
EmitSourceDepth("}\n");
|
||||||
|
EmitSourceDepth("break;\n");
|
||||||
|
cf_wrote_pc_ = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessLoopEndInstruction(
|
||||||
|
const ParsedLoopEndInstruction& instr) {
|
||||||
|
EmitSourceDepth("// ");
|
||||||
|
instr.Disassemble(&source_);
|
||||||
|
|
||||||
|
// Decrement loop counter, and if we are done break out.
|
||||||
|
EmitSourceDepth("if (--xe_loop_count.x == 0u");
|
||||||
|
if (instr.is_predicated_break) {
|
||||||
|
// If the predicate condition is met we 'break;' out of the loop.
|
||||||
|
// Need to restore stack and fall through to the next cf.
|
||||||
|
EmitSource(" || %cxe_p0) {\n", instr.predicate_condition ? ' ' : '!');
|
||||||
|
} else {
|
||||||
|
EmitSource(") {\n");
|
||||||
|
}
|
||||||
|
Indent();
|
||||||
|
|
||||||
|
// Loop completed - pop and fall through to next cf.
|
||||||
|
EmitSourceDepth("xe_loop_count.xyz = xe_loop_count.yzw;\n");
|
||||||
|
EmitSourceDepth("xe_loop_count.w = 0u;\n");
|
||||||
|
EmitSourceDepth("xe_aL.xyz = xe_aL.yzw;\n");
|
||||||
|
EmitSourceDepth("xe_aL.w = 0;\n");
|
||||||
|
EmitSourceDepth("xe_pc = %u; // Exit loop to L%u\n", instr.dword_index + 1,
|
||||||
|
instr.dword_index + 1);
|
||||||
|
|
||||||
|
Unindent();
|
||||||
|
EmitSourceDepth("} else {\n");
|
||||||
|
Indent();
|
||||||
|
|
||||||
|
// Still looping. Adjust index and jump back to body.
|
||||||
|
EmitSourceDepth("xe_aL.x += int((xe_loop_constants[%u] << 8u) >> 24u);\n",
|
||||||
|
instr.loop_constant_index);
|
||||||
|
EmitSourceDepth("xe_pc = %u; // Loop back to body L%u\n",
|
||||||
|
instr.loop_body_address, instr.loop_body_address);
|
||||||
|
|
||||||
|
Unindent();
|
||||||
|
EmitSourceDepth("}\n");
|
||||||
|
EmitSourceDepth("break;\n");
|
||||||
|
cf_wrote_pc_ = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessCallInstruction(
|
||||||
|
const ParsedCallInstruction& instr) {
|
||||||
|
EmitSourceDepth("// ");
|
||||||
|
instr.Disassemble(&source_);
|
||||||
|
|
||||||
|
EmitUnimplementedTranslationError();
|
||||||
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessReturnInstruction(
|
||||||
|
const ParsedReturnInstruction& instr) {
|
||||||
|
EmitSourceDepth("// ");
|
||||||
|
instr.Disassemble(&source_);
|
||||||
|
|
||||||
|
EmitUnimplementedTranslationError();
|
||||||
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessJumpInstruction(
|
||||||
|
const ParsedJumpInstruction& instr) {
|
||||||
|
EmitSourceDepth("// ");
|
||||||
|
instr.Disassemble(&source_);
|
||||||
|
|
||||||
|
bool needs_fallthrough = false;
|
||||||
|
switch (instr.type) {
|
||||||
|
case ParsedJumpInstruction::Type::kUnconditional:
|
||||||
|
EmitSourceDepth("{\n");
|
||||||
|
break;
|
||||||
|
case ParsedJumpInstruction::Type::kConditional:
|
||||||
|
EmitSourceDepth("if ((xe_bool_constants[%u] & (1u << %uu)) %c= 0u) {\n",
|
||||||
|
instr.bool_constant_index >> 5,
|
||||||
|
instr.bool_constant_index & 31,
|
||||||
|
instr.condition ? '!' : '=');
|
||||||
|
needs_fallthrough = true;
|
||||||
|
break;
|
||||||
|
case ParsedJumpInstruction::Type::kPredicated:
|
||||||
|
EmitSourceDepth("if (%cxe_p0) {\n", instr.condition ? ' ' : '!');
|
||||||
|
needs_fallthrough = true;
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
Indent();
|
||||||
|
|
||||||
|
EmitSourceDepth("xe_pc = %u; // L%u\n", instr.target_address,
|
||||||
|
instr.target_address);
|
||||||
|
EmitSourceDepth("break;\n");
|
||||||
|
|
||||||
|
Unindent();
|
||||||
|
if (needs_fallthrough) {
|
||||||
|
uint32_t next_address = instr.dword_index + 1;
|
||||||
|
EmitSourceDepth("} else {\n");
|
||||||
|
EmitSourceDepth(" xe_pc = %u; // Fallthrough to L%u\n", next_address,
|
||||||
|
next_address);
|
||||||
|
}
|
||||||
|
EmitSourceDepth("}\n");
|
||||||
|
}
|
||||||
|
|
||||||
|
void HlslShaderTranslator::ProcessAllocInstruction(
|
||||||
|
const ParsedAllocInstruction& instr) {
|
||||||
|
EmitSourceDepth("// ");
|
||||||
|
instr.Disassemble(&source_);
|
||||||
|
}
|
||||||
|
|
||||||
uint32_t HlslShaderTranslator::AddSRVBinding(SRVType type,
|
uint32_t HlslShaderTranslator::AddSRVBinding(SRVType type,
|
||||||
uint32_t fetch_constant) {
|
uint32_t fetch_constant) {
|
||||||
for (uint32_t i = 0; i < srv_bindings_.size(); ++i) {
|
for (uint32_t i = 0; i < srv_bindings_.size(); ++i) {
|
||||||
|
|
|
@ -46,6 +46,22 @@ class HlslShaderTranslator : public ShaderTranslator {
|
||||||
void EmitTranslationError(const char* message) override;
|
void EmitTranslationError(const char* message) override;
|
||||||
void EmitUnimplementedTranslationError() override;
|
void EmitUnimplementedTranslationError() override;
|
||||||
|
|
||||||
|
void ProcessLabel(uint32_t cf_index) override;
|
||||||
|
|
||||||
|
void ProcessControlFlowNopInstruction(uint32_t cf_index) override;
|
||||||
|
void ProcessControlFlowInstructionBegin(uint32_t cf_index) override;
|
||||||
|
void ProcessControlFlowInstructionEnd(uint32_t cf_index) override;
|
||||||
|
void ProcessExecInstructionBegin(const ParsedExecInstruction& instr) override;
|
||||||
|
void ProcessExecInstructionEnd(const ParsedExecInstruction& instr) override;
|
||||||
|
void ProcessLoopStartInstruction(
|
||||||
|
const ParsedLoopStartInstruction& instr) override;
|
||||||
|
void ProcessLoopEndInstruction(
|
||||||
|
const ParsedLoopEndInstruction& instr) override;
|
||||||
|
void ProcessCallInstruction(const ParsedCallInstruction& instr) override;
|
||||||
|
void ProcessReturnInstruction(const ParsedReturnInstruction& instr) override;
|
||||||
|
void ProcessJumpInstruction(const ParsedJumpInstruction& instr) override;
|
||||||
|
void ProcessAllocInstruction(const ParsedAllocInstruction& instr) override;
|
||||||
|
|
||||||
private:
|
private:
|
||||||
void Indent();
|
void Indent();
|
||||||
void Unindent();
|
void Unindent();
|
||||||
|
@ -54,6 +70,10 @@ class HlslShaderTranslator : public ShaderTranslator {
|
||||||
uint32_t depth_ = 0;
|
uint32_t depth_ = 0;
|
||||||
char depth_prefix_[16] = {0};
|
char depth_prefix_[16] = {0};
|
||||||
|
|
||||||
|
bool cf_wrote_pc_ = false;
|
||||||
|
bool cf_exec_pred_ = false;
|
||||||
|
bool cf_exec_pred_cond_ = false;
|
||||||
|
|
||||||
std::vector<SRVBinding> srv_bindings_;
|
std::vector<SRVBinding> srv_bindings_;
|
||||||
// Finds or adds an SRV binding to the shader's SRV list, returns t# index.
|
// Finds or adds an SRV binding to the shader's SRV list, returns t# index.
|
||||||
uint32_t AddSRVBinding(SRVType type, uint32_t fetch_constant);
|
uint32_t AddSRVBinding(SRVType type, uint32_t fetch_constant);
|
||||||
|
@ -64,6 +84,10 @@ class HlslShaderTranslator : public ShaderTranslator {
|
||||||
uint32_t sampler_fetch_constants_[32];
|
uint32_t sampler_fetch_constants_[32];
|
||||||
uint32_t sampler_count_ = 0;
|
uint32_t sampler_count_ = 0;
|
||||||
uint32_t AddSampler(uint32_t fetch_constant);
|
uint32_t AddSampler(uint32_t fetch_constant);
|
||||||
|
|
||||||
|
// Whether the cube instruction has been used and conversion functions need to
|
||||||
|
// be emitted.
|
||||||
|
bool cube_used_ = false;
|
||||||
};
|
};
|
||||||
|
|
||||||
} // namespace gpu
|
} // namespace gpu
|
||||||
|
|
Loading…
Reference in New Issue