forked from ShuriZma/suyu
1
0
Fork 0

Merge pull request #3502 from namkazt/patch-3

shader_decode: Reimplement BFE instructions
This commit is contained in:
Rodrigo Locatti 2020-03-15 21:23:04 -03:00 committed by GitHub
commit ddafc99776
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 53 additions and 29 deletions

View File

@ -911,14 +911,9 @@ union Instruction {
} fadd32i; } fadd32i;
union { union {
BitField<20, 8, u64> shift_position; BitField<40, 1, u64> brev;
BitField<28, 8, u64> shift_length; BitField<47, 1, u64> rd_cc;
BitField<48, 1, u64> negate_b; BitField<48, 1, u64> is_signed;
BitField<49, 1, u64> negate_a;
u64 GetLeftShiftValue() const {
return 32 - (shift_position + shift_length);
}
} bfe; } bfe;
union { union {

View File

@ -17,33 +17,60 @@ u32 ShaderIR::DecodeBfe(NodeBlock& bb, u32 pc) {
const Instruction instr = {program_code[pc]}; const Instruction instr = {program_code[pc]};
const auto opcode = OpCode::Decode(instr); const auto opcode = OpCode::Decode(instr);
UNIMPLEMENTED_IF(instr.bfe.negate_b);
Node op_a = GetRegister(instr.gpr8); Node op_a = GetRegister(instr.gpr8);
op_a = GetOperandAbsNegInteger(op_a, false, instr.bfe.negate_a, false); Node op_b = [&] {
switch (opcode->get().GetId()) {
case OpCode::Id::BFE_R:
return GetRegister(instr.gpr20);
case OpCode::Id::BFE_C:
return GetConstBuffer(instr.cbuf34.index, instr.cbuf34.GetOffset());
case OpCode::Id::BFE_IMM:
return Immediate(instr.alu.GetSignedImm20_20());
default:
UNREACHABLE();
return Immediate(0);
}
}();
switch (opcode->get().GetId()) { UNIMPLEMENTED_IF_MSG(instr.bfe.rd_cc, "Condition codes in BFE is not implemented");
case OpCode::Id::BFE_IMM: {
UNIMPLEMENTED_IF_MSG(instr.generates_cc,
"Condition codes generation in BFE is not implemented");
const Node inner_shift_imm = Immediate(static_cast<u32>(instr.bfe.GetLeftShiftValue())); const bool is_signed = instr.bfe.is_signed;
const Node outer_shift_imm =
Immediate(static_cast<u32>(instr.bfe.GetLeftShiftValue() + instr.bfe.shift_position));
const Node inner_shift = // using reverse parallel method in
Operation(OperationCode::ILogicalShiftLeft, NO_PRECISE, op_a, inner_shift_imm); // https://graphics.stanford.edu/~seander/bithacks.html#ReverseParallel
const Node outer_shift = // note for later if possible to implement faster method.
Operation(OperationCode::ILogicalShiftRight, NO_PRECISE, inner_shift, outer_shift_imm); if (instr.bfe.brev) {
const auto swap = [&](u32 s, u32 mask) {
SetInternalFlagsFromInteger(bb, outer_shift, instr.generates_cc); Node v1 =
SetRegister(bb, instr.gpr0, outer_shift); SignedOperation(OperationCode::ILogicalShiftRight, is_signed, op_a, Immediate(s));
break; if (mask != 0) {
} v1 = SignedOperation(OperationCode::IBitwiseAnd, is_signed, std::move(v1),
default: Immediate(mask));
UNIMPLEMENTED_MSG("Unhandled BFE instruction: {}", opcode->get().GetName()); }
Node v2 = op_a;
if (mask != 0) {
v2 = SignedOperation(OperationCode::IBitwiseAnd, is_signed, std::move(v2),
Immediate(mask));
}
v2 = SignedOperation(OperationCode::ILogicalShiftLeft, is_signed, std::move(v2),
Immediate(s));
return SignedOperation(OperationCode::IBitwiseOr, is_signed, std::move(v1),
std::move(v2));
};
op_a = swap(1, 0x55555555U);
op_a = swap(2, 0x33333333U);
op_a = swap(4, 0x0F0F0F0FU);
op_a = swap(8, 0x00FF00FFU);
op_a = swap(16, 0);
} }
const auto offset = SignedOperation(OperationCode::IBitfieldExtract, is_signed, op_b,
Immediate(0), Immediate(8));
const auto bits = SignedOperation(OperationCode::IBitfieldExtract, is_signed, op_b,
Immediate(8), Immediate(8));
auto result = SignedOperation(OperationCode::IBitfieldExtract, is_signed, op_a, offset, bits);
SetRegister(bb, instr.gpr0, std::move(result));
return pc; return pc;
} }

View File

@ -68,6 +68,8 @@ OperationCode SignedToUnsignedCode(OperationCode operation_code, bool is_signed)
return OperationCode::UBitwiseXor; return OperationCode::UBitwiseXor;
case OperationCode::IBitwiseNot: case OperationCode::IBitwiseNot:
return OperationCode::UBitwiseNot; return OperationCode::UBitwiseNot;
case OperationCode::IBitfieldExtract:
return OperationCode::UBitfieldExtract;
case OperationCode::IBitfieldInsert: case OperationCode::IBitfieldInsert:
return OperationCode::UBitfieldInsert; return OperationCode::UBitfieldInsert;
case OperationCode::IBitCount: case OperationCode::IBitCount: