[DXBC] Both v[#] and v[#][#] operands for HS and GS

This commit is contained in:
Triang3l 2022-05-07 16:17:17 +03:00
parent 5875f6ab31
commit e3425b242e
5 changed files with 145 additions and 150 deletions

View File

@ -2943,10 +2943,10 @@ D3D12RenderTargetCache::GetOrCreateTransferPipelines(TransferShaderKey key) {
kTransferSRVRegisterHostDepth)); kTransferSRVRegisterHostDepth));
} }
a.OpDclInputPSSIV(dxbc::InterpolationMode::kLinearNoPerspective, a.OpDclInputPSSIV(dxbc::InterpolationMode::kLinearNoPerspective,
dxbc::Dest::V(kInputRegisterPosition, 0b0011), dxbc::Dest::V1D(kInputRegisterPosition, 0b0011),
dxbc::Name::kPosition); dxbc::Name::kPosition);
if (key.dest_msaa_samples != xenos::MsaaSamples::k1X) { if (key.dest_msaa_samples != xenos::MsaaSamples::k1X) {
a.OpDclInputPSSGV(dxbc::Dest::V(kInputRegisterSampleIndex, 0b0001), a.OpDclInputPSSGV(dxbc::Dest::V1D(kInputRegisterSampleIndex, 0b0001),
dxbc::Name::kSampleIndex); dxbc::Name::kSampleIndex);
} }
if (osgn_parameter_index_sv_target != UINT32_MAX) { if (osgn_parameter_index_sv_target != UINT32_MAX) {
@ -2971,7 +2971,7 @@ D3D12RenderTargetCache::GetOrCreateTransferPipelines(TransferShaderKey key) {
// Split the destination pixel index into 32bpp tile in r0.z and // Split the destination pixel index into 32bpp tile in r0.z and
// 32bpp-tile-relative pixel index in r0.xy. // 32bpp-tile-relative pixel index in r0.xy.
// r0.xy = pixel XY as uint // r0.xy = pixel XY as uint
a.OpFToU(dxbc::Dest::R(0, 0b0011), dxbc::Src::V(kInputRegisterPosition)); a.OpFToU(dxbc::Dest::R(0, 0b0011), dxbc::Src::V1D(kInputRegisterPosition));
uint32_t dest_sample_width_log2 = uint32_t dest_sample_width_log2 =
uint32_t(dest_is_64bpp) + uint32_t(dest_is_64bpp) +
uint32_t(key.dest_msaa_samples >= xenos::MsaaSamples::k4X); uint32_t(key.dest_msaa_samples >= xenos::MsaaSamples::k4X);
@ -3057,7 +3057,7 @@ D3D12RenderTargetCache::GetOrCreateTransferPipelines(TransferShaderKey key) {
// If 64bpp -> 32bpp, also the needed half in r0.w. // If 64bpp -> 32bpp, also the needed half in r0.w.
dxbc::Src dest_sample( dxbc::Src dest_sample(
dxbc::Src::V(kInputRegisterSampleIndex, dxbc::Src::kXXXX)); dxbc::Src::V1D(kInputRegisterSampleIndex, dxbc::Src::kXXXX));
dxbc::Src source_sample(dest_sample); dxbc::Src source_sample(dest_sample);
uint32_t source_tile_pixel_x_reg = 0; uint32_t source_tile_pixel_x_reg = 0;
uint32_t source_tile_pixel_y_reg = 0; uint32_t source_tile_pixel_y_reg = 0;
@ -3086,7 +3086,7 @@ D3D12RenderTargetCache::GetOrCreateTransferPipelines(TransferShaderKey key) {
source_sample = dxbc::Src::R(1, dxbc::Src::kZZZZ); source_sample = dxbc::Src::R(1, dxbc::Src::kZZZZ);
a.OpBFI(dxbc::Dest::R(1, 0b0001), dxbc::Src::LU(31), dxbc::Src::LU(1), a.OpBFI(dxbc::Dest::R(1, 0b0001), dxbc::Src::LU(31), dxbc::Src::LU(1),
dxbc::Src::R(0, dxbc::Src::kXXXX), dxbc::Src::R(0, dxbc::Src::kXXXX),
dxbc::Src::V(kInputRegisterSampleIndex, dxbc::Src::kXXXX)); dxbc::Src::V1D(kInputRegisterSampleIndex, dxbc::Src::kXXXX));
source_tile_pixel_x_reg = 1; source_tile_pixel_x_reg = 1;
} else if (key.dest_msaa_samples == xenos::MsaaSamples::k2X) { } else if (key.dest_msaa_samples == xenos::MsaaSamples::k2X) {
// 32bpp -> 64bpp, 4x -> 2x. // 32bpp -> 64bpp, 4x -> 2x.
@ -3128,7 +3128,7 @@ D3D12RenderTargetCache::GetOrCreateTransferPipelines(TransferShaderKey key) {
a.OpIShL(dxbc::Dest::R(1, 0b0001), dxbc::Src::R(0, dxbc::Src::kXXXX), a.OpIShL(dxbc::Dest::R(1, 0b0001), dxbc::Src::R(0, dxbc::Src::kXXXX),
dxbc::Src::LU(2)); dxbc::Src::LU(2));
a.OpBFI(dxbc::Dest::R(1, 0b0001), dxbc::Src::LU(1), dxbc::Src::LU(1), a.OpBFI(dxbc::Dest::R(1, 0b0001), dxbc::Src::LU(1), dxbc::Src::LU(1),
dxbc::Src::V(kInputRegisterSampleIndex, dxbc::Src::kXXXX), dxbc::Src::V1D(kInputRegisterSampleIndex, dxbc::Src::kXXXX),
dxbc::Src::R(1, dxbc::Src::kXXXX)); dxbc::Src::R(1, dxbc::Src::kXXXX));
source_tile_pixel_x_reg = 1; source_tile_pixel_x_reg = 1;
// Y is handled by common code. // Y is handled by common code.

View File

@ -655,33 +655,6 @@ enum class OperandType : uint32_t {
kOutputStencilRef = 41, kOutputStencilRef = 41,
}; };
// D3D10_SB_OPERAND_INDEX_DIMENSION
constexpr uint32_t GetOperandIndexDimension(OperandType type,
bool in_dcl = false) {
switch (type) {
case OperandType::kTemp:
case OperandType::kInput:
// FIXME(Triang3l): kInput has a dimensionality of 2 in the control point
// phase of hull shaders, however, currently the translator isn't used to
// emit them - if code where this matters is emitted by Xenia, the actual
// dimensionality will need to be stored in OperandAddress itself.
case OperandType::kOutput:
case OperandType::kLabel:
return 1;
case OperandType::kIndexableTemp:
case OperandType::kInputControlPoint:
return 2;
case OperandType::kSampler:
case OperandType::kResource:
case OperandType::kUnorderedAccessView:
return in_dcl ? 3 : 2;
case OperandType::kConstantBuffer:
return 3;
default:
return 0;
}
}
// D3D10_SB_OPERAND_NUM_COMPONENTS // D3D10_SB_OPERAND_NUM_COMPONENTS
enum class OperandDimension : uint32_t { enum class OperandDimension : uint32_t {
kNoData, // D3D10_SB_OPERAND_0_COMPONENT kNoData, // D3D10_SB_OPERAND_0_COMPONENT
@ -766,11 +739,22 @@ struct Index {
struct OperandAddress { struct OperandAddress {
OperandType type_; OperandType type_;
uint32_t index_dimension_;
Index index_1d_, index_2d_, index_3d_; Index index_1d_, index_2d_, index_3d_;
explicit OperandAddress(OperandType type, Index index_1d = Index(), explicit OperandAddress(OperandType type)
Index index_2d = Index(), Index index_3d = Index()) : type_(type), index_dimension_(0) {}
explicit OperandAddress(OperandType type, Index index_1d)
: type_(type), index_dimension_(1), index_1d_(index_1d) {}
explicit OperandAddress(OperandType type, Index index_1d, Index index_2d)
: type_(type), : type_(type),
index_dimension_(2),
index_1d_(index_1d),
index_2d_(index_2d) {}
explicit OperandAddress(OperandType type, Index index_1d, Index index_2d,
Index index_3d)
: type_(type),
index_dimension_(3),
index_1d_(index_1d), index_1d_(index_1d),
index_2d_(index_2d), index_2d_(index_2d),
index_3d_(index_3d) {} index_3d_(index_3d) {}
@ -778,44 +762,38 @@ struct OperandAddress {
OperandDimension GetDimension(bool in_dcl = false) const { OperandDimension GetDimension(bool in_dcl = false) const {
return GetOperandDimension(type_, in_dcl); return GetOperandDimension(type_, in_dcl);
} }
uint32_t GetIndexDimension(bool in_dcl = false) const { uint32_t GetOperandTokenTypeAndIndex() const {
return GetOperandIndexDimension(type_, in_dcl); uint32_t operand_token = (uint32_t(type_) << 12) | (index_dimension_ << 20);
} if (index_dimension_ > 0) {
uint32_t GetOperandTokenTypeAndIndex(bool in_dcl = false) const {
uint32_t index_dimension = GetIndexDimension(in_dcl);
uint32_t operand_token = (uint32_t(type_) << 12) | (index_dimension << 20);
if (index_dimension > 0) {
operand_token |= uint32_t(index_1d_.GetRepresentation()) << 22; operand_token |= uint32_t(index_1d_.GetRepresentation()) << 22;
if (index_dimension > 1) { if (index_dimension_ > 1) {
operand_token |= uint32_t(index_2d_.GetRepresentation()) << 25; operand_token |= uint32_t(index_2d_.GetRepresentation()) << 25;
if (index_dimension > 2) { if (index_dimension_ > 2) {
operand_token |= uint32_t(index_3d_.GetRepresentation()) << 28; operand_token |= uint32_t(index_3d_.GetRepresentation()) << 28;
} }
} }
} }
return operand_token; return operand_token;
} }
uint32_t GetLength(bool in_dcl = false) const { uint32_t GetLength() const {
uint32_t length = 0; uint32_t length = 0;
uint32_t index_dimension = GetIndexDimension(in_dcl); if (index_dimension_ > 0) {
if (index_dimension > 0) {
length += index_1d_.GetLength(); length += index_1d_.GetLength();
if (index_dimension > 1) { if (index_dimension_ > 1) {
length += index_2d_.GetLength(); length += index_2d_.GetLength();
if (index_dimension > 2) { if (index_dimension_ > 2) {
length += index_3d_.GetLength(); length += index_3d_.GetLength();
} }
} }
} }
return length; return length;
} }
void Write(std::vector<uint32_t>& code, bool in_dcl = false) const { void Write(std::vector<uint32_t>& code) const {
uint32_t index_dimension = GetIndexDimension(in_dcl); if (index_dimension_ > 0) {
if (index_dimension > 0) {
index_1d_.Write(code); index_1d_.Write(code);
if (index_dimension > 1) { if (index_dimension_ > 1) {
index_2d_.Write(code); index_2d_.Write(code);
if (index_dimension > 2) { if (index_dimension_ > 2) {
index_3d_.Write(code); index_3d_.Write(code);
} }
} }
@ -845,18 +823,28 @@ struct Dest : OperandAddress {
// declarations use read masks instead of swizzle (resource declarations still // declarations use read masks instead of swizzle (resource declarations still
// use swizzle when they're vector, however). // use swizzle when they're vector, however).
explicit Dest(OperandType type, uint32_t write_mask = 0b1111, explicit Dest(OperandType type, uint32_t write_mask)
Index index_1d = Index(), Index index_2d = Index(), : OperandAddress(type), write_mask_(write_mask) {}
Index index_3d = Index()) explicit Dest(OperandType type, uint32_t write_mask, Index index_1d)
: OperandAddress(type, index_1d), write_mask_(write_mask) {}
explicit Dest(OperandType type, uint32_t write_mask, Index index_1d,
Index index_2d)
: OperandAddress(type, index_1d, index_2d), write_mask_(write_mask) {}
explicit Dest(OperandType type, uint32_t write_mask, Index index_1d,
Index index_2d, Index index_3d)
: OperandAddress(type, index_1d, index_2d, index_3d), : OperandAddress(type, index_1d, index_2d, index_3d),
write_mask_(write_mask) {} write_mask_(write_mask) {}
static Dest R(uint32_t index, uint32_t write_mask = 0b1111) { static Dest R(uint32_t index, uint32_t write_mask = 0b1111) {
return Dest(OperandType::kTemp, write_mask, index); return Dest(OperandType::kTemp, write_mask, index);
} }
static Dest V(uint32_t index, uint32_t read_mask = 0b1111) { static Dest V1D(uint32_t index, uint32_t read_mask = 0b1111) {
return Dest(OperandType::kInput, read_mask, index); return Dest(OperandType::kInput, read_mask, index);
} }
static Dest V2D(uint32_t index_1d, uint32_t index_2d,
uint32_t read_mask = 0b1111) {
return Dest(OperandType::kInput, read_mask, index_1d, index_2d);
}
static Dest O(Index index, uint32_t write_mask = 0b1111) { static Dest O(Index index, uint32_t write_mask = 0b1111) {
return Dest(OperandType::kOutput, write_mask, index); return Dest(OperandType::kOutput, write_mask, index);
} }
@ -915,11 +903,14 @@ struct Dest : OperandAddress {
} }
} }
[[nodiscard]] Dest Mask(uint32_t write_mask) const { [[nodiscard]] Dest Mask(uint32_t write_mask) const {
return Dest(type_, write_mask, index_1d_, index_2d_, index_3d_); Dest new_dest(*this);
new_dest.write_mask_ = write_mask;
return new_dest;
} }
[[nodiscard]] Dest MaskMasked(uint32_t write_mask) const { [[nodiscard]] Dest MaskMasked(uint32_t write_mask) const {
return Dest(type_, write_mask_ & write_mask, index_1d_, index_2d_, Dest new_dest(*this);
index_3d_); new_dest.write_mask_ &= write_mask;
return new_dest;
} }
static uint32_t GetMaskSingleComponent(uint32_t write_mask) { static uint32_t GetMaskSingleComponent(uint32_t write_mask) {
uint32_t component; uint32_t component;
@ -934,11 +925,9 @@ struct Dest : OperandAddress {
return GetMaskSingleComponent(GetMask(in_dcl)); return GetMaskSingleComponent(GetMask(in_dcl));
} }
uint32_t GetLength(bool in_dcl = false) const { uint32_t GetLength() const { return 1 + OperandAddress::GetLength(); }
return 1 + OperandAddress::GetLength(in_dcl);
}
void Write(std::vector<uint32_t>& code, bool in_dcl = false) const { void Write(std::vector<uint32_t>& code, bool in_dcl = false) const {
uint32_t operand_token = GetOperandTokenTypeAndIndex(in_dcl); uint32_t operand_token = GetOperandTokenTypeAndIndex();
OperandDimension dimension = GetDimension(in_dcl); OperandDimension dimension = GetDimension(in_dcl);
operand_token |= uint32_t(dimension); operand_token |= uint32_t(dimension);
if (dimension == OperandDimension::kVector) { if (dimension == OperandDimension::kVector) {
@ -947,7 +936,7 @@ struct Dest : OperandAddress {
(uint32_t(ComponentSelection::kMask) << 2) | (write_mask_ << 4); (uint32_t(ComponentSelection::kMask) << 2) | (write_mask_ << 4);
} }
code.push_back(operand_token); code.push_back(operand_token);
OperandAddress::Write(code, in_dcl); OperandAddress::Write(code);
} }
}; };
@ -962,18 +951,21 @@ struct Src : OperandAddress {
// Ignored for 0-component and 1-component operand types. // Ignored for 0-component and 1-component operand types.
uint32_t swizzle_; uint32_t swizzle_;
bool absolute_; bool absolute_ = false;
bool negate_; bool negate_ = false;
// Only valid for OperandType::kImmediate32. // Only valid for OperandType::kImmediate32.
uint32_t immediate_[4]; uint32_t immediate_[4];
explicit Src(OperandType type, uint32_t swizzle = kXYZW, explicit Src(OperandType type, uint32_t swizzle)
Index index_1d = Index(), Index index_2d = Index(), : OperandAddress(type), swizzle_(swizzle) {}
Index index_3d = Index()) explicit Src(OperandType type, uint32_t swizzle, Index index_1d)
: OperandAddress(type, index_1d, index_2d, index_3d), : OperandAddress(type, index_1d), swizzle_(swizzle) {}
swizzle_(swizzle), explicit Src(OperandType type, uint32_t swizzle, Index index_1d,
absolute_(false), Index index_2d)
negate_(false) {} : OperandAddress(type, index_1d, index_2d), swizzle_(swizzle) {}
explicit Src(OperandType type, uint32_t swizzle, Index index_1d,
Index index_2d, Index index_3d)
: OperandAddress(type, index_1d, index_2d, index_3d), swizzle_(swizzle) {}
// For creating instances for use in declarations. // For creating instances for use in declarations.
struct DclT {}; struct DclT {};
@ -982,9 +974,12 @@ struct Src : OperandAddress {
static Src R(uint32_t index, uint32_t swizzle = kXYZW) { static Src R(uint32_t index, uint32_t swizzle = kXYZW) {
return Src(OperandType::kTemp, swizzle, index); return Src(OperandType::kTemp, swizzle, index);
} }
static Src V(Index index, uint32_t swizzle = kXYZW) { static Src V1D(Index index, uint32_t swizzle = kXYZW) {
return Src(OperandType::kInput, swizzle, index); return Src(OperandType::kInput, swizzle, index);
} }
static Src V2D(Index index_1d, Index index_2d, uint32_t swizzle = kXYZW) {
return Src(OperandType::kInput, swizzle, index_1d, index_2d);
}
static Src X(uint32_t index_1d, Index index_2d, uint32_t swizzle = kXYZW) { static Src X(uint32_t index_1d, Index index_2d, uint32_t swizzle = kXYZW) {
return Src(OperandType::kIndexableTemp, swizzle, index_1d, index_2d); return Src(OperandType::kIndexableTemp, swizzle, index_1d, index_2d);
} }
@ -1108,15 +1103,14 @@ struct Src : OperandAddress {
return new_src; return new_src;
} }
uint32_t GetLength(uint32_t mask, bool force_vector = false, uint32_t GetLength(uint32_t mask, bool force_vector = false) const {
bool in_dcl = false) const {
bool is_vector = bool is_vector =
force_vector || force_vector ||
(mask != 0b0000 && Dest::GetMaskSingleComponent(mask) == UINT32_MAX); (mask != 0b0000 && Dest::GetMaskSingleComponent(mask) == UINT32_MAX);
if (type_ == OperandType::kImmediate32) { if (type_ == OperandType::kImmediate32) {
return is_vector ? 5 : 2; return is_vector ? 5 : 2;
} }
return ((absolute_ || negate_) ? 2 : 1) + OperandAddress::GetLength(in_dcl); return ((absolute_ || negate_) ? 2 : 1) + OperandAddress::GetLength();
} }
static constexpr uint32_t GetModifiedImmediate(uint32_t value, static constexpr uint32_t GetModifiedImmediate(uint32_t value,
bool is_integer, bool absolute, bool is_integer, bool absolute,
@ -1147,7 +1141,7 @@ struct Src : OperandAddress {
} }
void Write(std::vector<uint32_t>& code, bool is_integer, uint32_t mask, void Write(std::vector<uint32_t>& code, bool is_integer, uint32_t mask,
bool force_vector = false, bool in_dcl = false) const { bool force_vector = false, bool in_dcl = false) const {
uint32_t operand_token = GetOperandTokenTypeAndIndex(in_dcl); uint32_t operand_token = GetOperandTokenTypeAndIndex();
uint32_t mask_single_component = Dest::GetMaskSingleComponent(mask); uint32_t mask_single_component = Dest::GetMaskSingleComponent(mask);
uint32_t select_component = uint32_t select_component =
mask_single_component != UINT32_MAX ? mask_single_component : 0; mask_single_component != UINT32_MAX ? mask_single_component : 0;
@ -1220,7 +1214,7 @@ struct Src : OperandAddress {
code.push_back(uint32_t(ExtendedOperandType::kModifier) | code.push_back(uint32_t(ExtendedOperandType::kModifier) |
(uint32_t(modifier) << 6)); (uint32_t(modifier) << 6));
} }
OperandAddress::Write(code, in_dcl); OperandAddress::Write(code);
} }
} }
}; };
@ -1915,7 +1909,7 @@ class Assembler {
} }
void OpDclResource(ResourceDimension dimension, uint32_t return_type_token, void OpDclResource(ResourceDimension dimension, uint32_t return_type_token,
const Src& operand, uint32_t space = 0) { const Src& operand, uint32_t space = 0) {
uint32_t operands_length = operand.GetLength(0b1111, false, true); uint32_t operands_length = operand.GetLength(0b1111, false);
code_.reserve(code_.size() + 3 + operands_length); code_.reserve(code_.size() + 3 + operands_length);
code_.push_back(OpcodeToken(Opcode::kDclResource, 2 + operands_length) | code_.push_back(OpcodeToken(Opcode::kDclResource, 2 + operands_length) |
(uint32_t(dimension) << 11)); (uint32_t(dimension) << 11));
@ -1929,7 +1923,7 @@ class Assembler {
ConstantBufferAccessPattern access_pattern = ConstantBufferAccessPattern access_pattern =
ConstantBufferAccessPattern::kImmediateIndexed, ConstantBufferAccessPattern::kImmediateIndexed,
uint32_t space = 0) { uint32_t space = 0) {
uint32_t operands_length = operand.GetLength(0b1111, false, true); uint32_t operands_length = operand.GetLength(0b1111, false);
code_.reserve(code_.size() + 3 + operands_length); code_.reserve(code_.size() + 3 + operands_length);
code_.push_back( code_.push_back(
OpcodeToken(Opcode::kDclConstantBuffer, 2 + operands_length) | OpcodeToken(Opcode::kDclConstantBuffer, 2 + operands_length) |
@ -1941,7 +1935,7 @@ class Assembler {
void OpDclSampler(const Src& operand, void OpDclSampler(const Src& operand,
SamplerMode mode = SamplerMode::kDefault, SamplerMode mode = SamplerMode::kDefault,
uint32_t space = 0) { uint32_t space = 0) {
uint32_t operands_length = operand.GetLength(0b1111, false, true); uint32_t operands_length = operand.GetLength(0b1111, false);
code_.reserve(code_.size() + 2 + operands_length); code_.reserve(code_.size() + 2 + operands_length);
code_.push_back(OpcodeToken(Opcode::kDclSampler, 1 + operands_length) | code_.push_back(OpcodeToken(Opcode::kDclSampler, 1 + operands_length) |
(uint32_t(mode) << 11)); (uint32_t(mode) << 11));
@ -1949,14 +1943,14 @@ class Assembler {
code_.push_back(space); code_.push_back(space);
} }
void OpDclInput(const Dest& operand) { void OpDclInput(const Dest& operand) {
uint32_t operands_length = operand.GetLength(true); uint32_t operands_length = operand.GetLength();
code_.reserve(code_.size() + 1 + operands_length); code_.reserve(code_.size() + 1 + operands_length);
code_.push_back(OpcodeToken(Opcode::kDclInput, operands_length)); code_.push_back(OpcodeToken(Opcode::kDclInput, operands_length));
operand.Write(code_, true); operand.Write(code_, true);
++stat_.dcl_count; ++stat_.dcl_count;
} }
void OpDclInputSGV(const Dest& operand, Name name) { void OpDclInputSGV(const Dest& operand, Name name) {
uint32_t operands_length = operand.GetLength(true); uint32_t operands_length = operand.GetLength();
code_.reserve(code_.size() + 2 + operands_length); code_.reserve(code_.size() + 2 + operands_length);
code_.push_back(OpcodeToken(Opcode::kDclInputSGV, 1 + operands_length)); code_.push_back(OpcodeToken(Opcode::kDclInputSGV, 1 + operands_length));
operand.Write(code_, true); operand.Write(code_, true);
@ -1964,7 +1958,7 @@ class Assembler {
++stat_.dcl_count; ++stat_.dcl_count;
} }
void OpDclInputPS(InterpolationMode interpolation_mode, const Dest& operand) { void OpDclInputPS(InterpolationMode interpolation_mode, const Dest& operand) {
uint32_t operands_length = operand.GetLength(true); uint32_t operands_length = operand.GetLength();
code_.reserve(code_.size() + 1 + operands_length); code_.reserve(code_.size() + 1 + operands_length);
code_.push_back(OpcodeToken(Opcode::kDclInputPS, operands_length) | code_.push_back(OpcodeToken(Opcode::kDclInputPS, operands_length) |
(uint32_t(interpolation_mode) << 11)); (uint32_t(interpolation_mode) << 11));
@ -1972,7 +1966,7 @@ class Assembler {
++stat_.dcl_count; ++stat_.dcl_count;
} }
void OpDclInputPSSGV(const Dest& operand, Name name) { void OpDclInputPSSGV(const Dest& operand, Name name) {
uint32_t operands_length = operand.GetLength(true); uint32_t operands_length = operand.GetLength();
code_.reserve(code_.size() + 2 + operands_length); code_.reserve(code_.size() + 2 + operands_length);
// Constant interpolation mode is set in FXC output at least for // Constant interpolation mode is set in FXC output at least for
// SV_IsFrontFace, despite the comment in d3d12TokenizedProgramFormat.hpp // SV_IsFrontFace, despite the comment in d3d12TokenizedProgramFormat.hpp
@ -1985,7 +1979,7 @@ class Assembler {
} }
void OpDclInputPSSIV(InterpolationMode interpolation_mode, void OpDclInputPSSIV(InterpolationMode interpolation_mode,
const Dest& operand, Name name) { const Dest& operand, Name name) {
uint32_t operands_length = operand.GetLength(true); uint32_t operands_length = operand.GetLength();
code_.reserve(code_.size() + 2 + operands_length); code_.reserve(code_.size() + 2 + operands_length);
code_.push_back(OpcodeToken(Opcode::kDclInputPSSIV, 1 + operands_length) | code_.push_back(OpcodeToken(Opcode::kDclInputPSSIV, 1 + operands_length) |
(uint32_t(interpolation_mode) << 11)); (uint32_t(interpolation_mode) << 11));
@ -1994,14 +1988,14 @@ class Assembler {
++stat_.dcl_count; ++stat_.dcl_count;
} }
void OpDclOutput(const Dest& operand) { void OpDclOutput(const Dest& operand) {
uint32_t operands_length = operand.GetLength(true); uint32_t operands_length = operand.GetLength();
code_.reserve(code_.size() + 1 + operands_length); code_.reserve(code_.size() + 1 + operands_length);
code_.push_back(OpcodeToken(Opcode::kDclOutput, operands_length)); code_.push_back(OpcodeToken(Opcode::kDclOutput, operands_length));
operand.Write(code_, true); operand.Write(code_, true);
++stat_.dcl_count; ++stat_.dcl_count;
} }
void OpDclOutputSIV(const Dest& operand, Name name) { void OpDclOutputSIV(const Dest& operand, Name name) {
uint32_t operands_length = operand.GetLength(true); uint32_t operands_length = operand.GetLength();
code_.reserve(code_.size() + 2 + operands_length); code_.reserve(code_.size() + 2 + operands_length);
code_.push_back(OpcodeToken(Opcode::kDclOutputSIV, 1 + operands_length)); code_.push_back(OpcodeToken(Opcode::kDclOutputSIV, 1 + operands_length));
operand.Write(code_, true); operand.Write(code_, true);
@ -2124,7 +2118,7 @@ class Assembler {
void OpDclUnorderedAccessViewTyped(ResourceDimension dimension, void OpDclUnorderedAccessViewTyped(ResourceDimension dimension,
uint32_t flags, uint32_t return_type_token, uint32_t flags, uint32_t return_type_token,
const Src& operand, uint32_t space = 0) { const Src& operand, uint32_t space = 0) {
uint32_t operands_length = operand.GetLength(0b1111, false, true); uint32_t operands_length = operand.GetLength(0b1111, false);
code_.reserve(code_.size() + 3 + operands_length); code_.reserve(code_.size() + 3 + operands_length);
code_.push_back( code_.push_back(
OpcodeToken(Opcode::kDclUnorderedAccessViewTyped, 2 + operands_length) | OpcodeToken(Opcode::kDclUnorderedAccessViewTyped, 2 + operands_length) |
@ -2137,7 +2131,7 @@ class Assembler {
// kUAVFlagRasterizerOrderedAccess. // kUAVFlagRasterizerOrderedAccess.
void OpDclUnorderedAccessViewRaw(uint32_t flags, const Src& operand, void OpDclUnorderedAccessViewRaw(uint32_t flags, const Src& operand,
uint32_t space = 0) { uint32_t space = 0) {
uint32_t operands_length = operand.GetLength(0b1111, false, true); uint32_t operands_length = operand.GetLength(0b1111, false);
code_.reserve(code_.size() + 2 + operands_length); code_.reserve(code_.size() + 2 + operands_length);
code_.push_back( code_.push_back(
OpcodeToken(Opcode::kDclUnorderedAccessViewRaw, 1 + operands_length) | OpcodeToken(Opcode::kDclUnorderedAccessViewRaw, 1 + operands_length) |
@ -2146,7 +2140,7 @@ class Assembler {
code_.push_back(space); code_.push_back(space);
} }
void OpDclResourceRaw(const Src& operand, uint32_t space = 0) { void OpDclResourceRaw(const Src& operand, uint32_t space = 0) {
uint32_t operands_length = operand.GetLength(0b1111, false, true); uint32_t operands_length = operand.GetLength(0b1111, false);
code_.reserve(code_.size() + 2 + operands_length); code_.reserve(code_.size() + 2 + operands_length);
code_.push_back(OpcodeToken(Opcode::kDclResourceRaw, 1 + operands_length)); code_.push_back(OpcodeToken(Opcode::kDclResourceRaw, 1 + operands_length));
operand.Write(code_, true, 0b1111, false, true); operand.Write(code_, true, 0b1111, false, true);

View File

@ -326,15 +326,16 @@ void DxbcShaderTranslator::StartVertexShader_LoadVertexIndex() {
// Check if the closing vertex of a non-indexed line loop is being processed. // Check if the closing vertex of a non-indexed line loop is being processed.
a_.OpINE( a_.OpINE(
index_dest, index_dest,
dxbc::Src::V(uint32_t(InOutRegister::kVSInVertexIndex), dxbc::Src::kXXXX), dxbc::Src::V1D(uint32_t(InOutRegister::kVSInVertexIndex),
dxbc::Src::kXXXX),
LoadSystemConstant(SystemConstants::Index::kLineLoopClosingIndex, LoadSystemConstant(SystemConstants::Index::kLineLoopClosingIndex,
offsetof(SystemConstants, line_loop_closing_index), offsetof(SystemConstants, line_loop_closing_index),
dxbc::Src::kXXXX)); dxbc::Src::kXXXX));
// Zero the index if processing the closing vertex of a line loop, or do // Zero the index if processing the closing vertex of a line loop, or do
// nothing (replace 0 with 0) if not needed. // nothing (replace 0 with 0) if not needed.
a_.OpAnd( a_.OpAnd(index_dest,
index_dest, dxbc::Src::V1D(uint32_t(InOutRegister::kVSInVertexIndex),
dxbc::Src::V(uint32_t(InOutRegister::kVSInVertexIndex), dxbc::Src::kXXXX), dxbc::Src::kXXXX),
index_src); index_src);
{ {
@ -590,7 +591,7 @@ void DxbcShaderTranslator::StartPixelShader() {
// system_temp_depth_stencil_ before any return statement is possibly // system_temp_depth_stencil_ before any return statement is possibly
// reached. // reached.
assert_true(system_temp_depth_stencil_ != UINT32_MAX); assert_true(system_temp_depth_stencil_ != UINT32_MAX);
dxbc::Src in_position_z(dxbc::Src::V( dxbc::Src in_position_z(dxbc::Src::V1D(
uint32_t(InOutRegister::kPSInPosition), dxbc::Src::kZZZZ)); uint32_t(InOutRegister::kPSInPosition), dxbc::Src::kZZZZ));
in_position_used_ |= 0b0100; in_position_used_ |= 0b0100;
a_.OpDerivRTXCoarse(dxbc::Dest::R(system_temp_depth_stencil_, 0b0001), a_.OpDerivRTXCoarse(dxbc::Dest::R(system_temp_depth_stencil_, 0b0001),
@ -633,14 +634,14 @@ void DxbcShaderTranslator::StartPixelShader() {
// At center. // At center.
a_.OpMov(uses_register_dynamic_addressing ? dxbc::Dest::X(0, i) a_.OpMov(uses_register_dynamic_addressing ? dxbc::Dest::X(0, i)
: dxbc::Dest::R(i), : dxbc::Dest::R(i),
dxbc::Src::V(uint32_t(InOutRegister::kPSInInterpolators) + i)); dxbc::Src::V1D(uint32_t(InOutRegister::kPSInInterpolators) + i));
a_.OpElse(); a_.OpElse();
// At centroid. Not really important that 2x MSAA is emulated using // At centroid. Not really important that 2x MSAA is emulated using
// ForcedSampleCount 4 - what matters is that the sample position will // ForcedSampleCount 4 - what matters is that the sample position will
// be within the primitive, and the value will not be extrapolated. // be within the primitive, and the value will not be extrapolated.
a_.OpEvalCentroid( a_.OpEvalCentroid(
dxbc::Dest::R(centroid_register), dxbc::Dest::R(centroid_register),
dxbc::Src::V(uint32_t(InOutRegister::kPSInInterpolators) + i)); dxbc::Src::V1D(uint32_t(InOutRegister::kPSInInterpolators) + i));
if (uses_register_dynamic_addressing) { if (uses_register_dynamic_addressing) {
a_.OpMov(dxbc::Dest::X(0, i), dxbc::Src::R(centroid_register)); a_.OpMov(dxbc::Dest::X(0, i), dxbc::Src::R(centroid_register));
} }
@ -677,7 +678,7 @@ void DxbcShaderTranslator::StartPixelShader() {
// have correct derivative magnitude and LODs. // have correct derivative magnitude and LODs.
in_position_used_ |= 0b0011; in_position_used_ |= 0b0011;
a_.OpRoundNI(dxbc::Dest::R(param_gen_temp, 0b0011), a_.OpRoundNI(dxbc::Dest::R(param_gen_temp, 0b0011),
dxbc::Src::V(uint32_t(InOutRegister::kPSInPosition))); dxbc::Src::V1D(uint32_t(InOutRegister::kPSInPosition)));
uint32_t resolution_scaled_axes = uint32_t resolution_scaled_axes =
uint32_t(draw_resolution_scale_x_ > 1) | uint32_t(draw_resolution_scale_x_ > 1) |
(uint32_t(draw_resolution_scale_y_ > 1) << 1); (uint32_t(draw_resolution_scale_y_ > 1) << 1);
@ -701,9 +702,9 @@ void DxbcShaderTranslator::StartPixelShader() {
// Negate modifier flips the sign bit even for 0 - set it to minus for // Negate modifier flips the sign bit even for 0 - set it to minus for
// backfaces. // backfaces.
in_front_face_used_ = true; in_front_face_used_ = true;
a_.OpMovC( a_.OpMovC(dxbc::Dest::R(param_gen_temp, 0b0001),
dxbc::Dest::R(param_gen_temp, 0b0001), dxbc::Src::V1D(
dxbc::Src::V(uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex), uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex),
dxbc::Src::kXXXX), dxbc::Src::kXXXX),
dxbc::Src::R(param_gen_temp, dxbc::Src::kXXXX), dxbc::Src::R(param_gen_temp, dxbc::Src::kXXXX),
-dxbc::Src::R(param_gen_temp, dxbc::Src::kXXXX)); -dxbc::Src::R(param_gen_temp, dxbc::Src::kXXXX));
@ -713,7 +714,7 @@ void DxbcShaderTranslator::StartPixelShader() {
// Saturate to avoid negative point coordinates if the center of the pixel // Saturate to avoid negative point coordinates if the center of the pixel
// is not covered, and extrapolation is done. // is not covered, and extrapolation is done.
a_.OpMov(dxbc::Dest::R(param_gen_temp, 0b1100), a_.OpMov(dxbc::Dest::R(param_gen_temp, 0b1100),
dxbc::Src::V(uint32_t(InOutRegister::kPSInPointParameters), dxbc::Src::V1D(uint32_t(InOutRegister::kPSInPointParameters),
0b0100 << 4), 0b0100 << 4),
true); true);
// Primitive type. // Primitive type.
@ -3499,7 +3500,7 @@ void DxbcShaderTranslator::WriteShaderCode() {
if (register_count()) { if (register_count()) {
// Unswapped vertex index input (only X component). // Unswapped vertex index input (only X component).
ao_.OpDclInputSGV( ao_.OpDclInputSGV(
dxbc::Dest::V(uint32_t(InOutRegister::kVSInVertexIndex), 0b0001), dxbc::Dest::V1D(uint32_t(InOutRegister::kVSInVertexIndex), 0b0001),
dxbc::Name::kVertexID); dxbc::Name::kVertexID);
} }
} }
@ -3537,13 +3538,13 @@ void DxbcShaderTranslator::WriteShaderCode() {
for (uint32_t i = 0; i < interpolator_count; ++i) { for (uint32_t i = 0; i < interpolator_count; ++i) {
ao_.OpDclInputPS( ao_.OpDclInputPS(
dxbc::InterpolationMode::kLinear, dxbc::InterpolationMode::kLinear,
dxbc::Dest::V(uint32_t(InOutRegister::kPSInInterpolators) + i)); dxbc::Dest::V1D(uint32_t(InOutRegister::kPSInInterpolators) + i));
} }
if (register_count()) { if (register_count()) {
// Point parameters input (only coordinates, not size, needed). // Point parameters input (only coordinates, not size, needed).
ao_.OpDclInputPS( ao_.OpDclInputPS(
dxbc::InterpolationMode::kLinear, dxbc::InterpolationMode::kLinear,
dxbc::Dest::V(uint32_t(InOutRegister::kPSInPointParameters), dxbc::Dest::V1D(uint32_t(InOutRegister::kPSInPointParameters),
0b0011)); 0b0011));
} }
} }
@ -3560,7 +3561,7 @@ void DxbcShaderTranslator::WriteShaderCode() {
(is_writing_float24_depth && !shader_writes_depth) (is_writing_float24_depth && !shader_writes_depth)
? dxbc::InterpolationMode::kLinearNoPerspectiveSample ? dxbc::InterpolationMode::kLinearNoPerspectiveSample
: dxbc::InterpolationMode::kLinearNoPerspective, : dxbc::InterpolationMode::kLinearNoPerspective,
dxbc::Dest::V(uint32_t(InOutRegister::kPSInPosition), dxbc::Dest::V1D(uint32_t(InOutRegister::kPSInPosition),
in_position_used_), in_position_used_),
dxbc::Name::kPosition); dxbc::Name::kPosition);
} }
@ -3575,7 +3576,7 @@ void DxbcShaderTranslator::WriteShaderCode() {
if (front_face_and_sample_index_mask) { if (front_face_and_sample_index_mask) {
// Is front face, sample index. // Is front face, sample index.
ao_.OpDclInputPSSGV( ao_.OpDclInputPSSGV(
dxbc::Dest::V(uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex), dxbc::Dest::V1D(uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex),
front_face_and_sample_index_mask), front_face_and_sample_index_mask),
dxbc::Name::kIsFrontFace); dxbc::Name::kIsFrontFace);
} }

View File

@ -139,7 +139,7 @@ void DxbcShaderTranslator::ExportToMemory() {
in_position_used_ |= resolution_scaled_axes; in_position_used_ |= resolution_scaled_axes;
a_.OpFToU( a_.OpFToU(
dxbc::Dest::R(control_temp, resolution_scaled_axes << 1), dxbc::Dest::R(control_temp, resolution_scaled_axes << 1),
dxbc::Src::V(uint32_t(InOutRegister::kPSInPosition), 0b0100 << 2)); dxbc::Src::V1D(uint32_t(InOutRegister::kPSInPosition), 0b0100 << 2));
dxbc::Dest resolution_scaling_temp_dest( dxbc::Dest resolution_scaling_temp_dest(
dxbc::Dest::R(control_temp, 0b1000)); dxbc::Dest::R(control_temp, 0b1000));
dxbc::Src resolution_scaling_temp_src( dxbc::Src resolution_scaling_temp_src(
@ -201,7 +201,7 @@ void DxbcShaderTranslator::ExportToMemory() {
a_.OpIEq( a_.OpIEq(
dxbc::Dest::R(control_temp, dxbc::Dest::R(control_temp,
inner_condition_provided ? 0b0010 : 0b0001), inner_condition_provided ? 0b0010 : 0b0001),
dxbc::Src::V(uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex), dxbc::Src::V1D(uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex),
dxbc::Src::kYYYY), dxbc::Src::kYYYY),
dxbc::Src::R(control_temp, dxbc::Src::kYYYY)); dxbc::Src::R(control_temp, dxbc::Src::kYYYY));
if (inner_condition_provided) { if (inner_condition_provided) {

View File

@ -172,7 +172,7 @@ void DxbcShaderTranslator::StartPixelShader_LoadROVParameters() {
// system_temp_rov_params_.y = Y host pixel position as uint // system_temp_rov_params_.y = Y host pixel position as uint
in_position_used_ |= 0b0011; in_position_used_ |= 0b0011;
a_.OpFToU(dxbc::Dest::R(system_temp_rov_params_, 0b0011), a_.OpFToU(dxbc::Dest::R(system_temp_rov_params_, 0b0011),
dxbc::Src::V(uint32_t(InOutRegister::kPSInPosition))); dxbc::Src::V1D(uint32_t(InOutRegister::kPSInPosition)));
// Convert the position from pixels to samples. // Convert the position from pixels to samples.
// system_temp_rov_params_.x = X sample 0 position // system_temp_rov_params_.x = X sample 0 position
// system_temp_rov_params_.y = Y sample 0 position // system_temp_rov_params_.y = Y sample 0 position
@ -605,8 +605,8 @@ void DxbcShaderTranslator::ROV_DepthStencilTest() {
ROV_DepthTo24Bit(system_temp_depth_stencil_, 0, system_temp_depth_stencil_, ROV_DepthTo24Bit(system_temp_depth_stencil_, 0, system_temp_depth_stencil_,
0, temp, 0); 0, temp, 0);
} else { } else {
dxbc::Src in_position_z( dxbc::Src in_position_z(dxbc::Src::V1D(
dxbc::Src::V(uint32_t(InOutRegister::kPSInPosition), dxbc::Src::kZZZZ)); uint32_t(InOutRegister::kPSInPosition), dxbc::Src::kZZZZ));
// Get the derivatives of the screen-space (but not clamped to the viewport // Get the derivatives of the screen-space (but not clamped to the viewport
// depth bounds yet - this happens after the pixel shader in Direct3D 11+; // depth bounds yet - this happens after the pixel shader in Direct3D 11+;
// also linear within the triangle - thus constant derivatives along the // also linear within the triangle - thus constant derivatives along the
@ -645,8 +645,8 @@ void DxbcShaderTranslator::ROV_DepthStencilTest() {
a_.OpMax(temp_z_dest, z_ddx_src.Abs(), z_ddy_src.Abs()); a_.OpMax(temp_z_dest, z_ddx_src.Abs(), z_ddy_src.Abs());
// Calculate the depth bias for the needed faceness. // Calculate the depth bias for the needed faceness.
in_front_face_used_ = true; in_front_face_used_ = true;
a_.OpIf(true, a_.OpIf(true, dxbc::Src::V1D(
dxbc::Src::V(uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex), uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex),
dxbc::Src::kXXXX)); dxbc::Src::kXXXX));
// temp.x if early = ddx(z) // temp.x if early = ddx(z)
// temp.y if early = ddy(z) // temp.y if early = ddy(z)
@ -949,7 +949,7 @@ void DxbcShaderTranslator::ROV_DepthStencilTest() {
{ {
// Check the current face to get the reference and apply the read mask. // Check the current face to get the reference and apply the read mask.
in_front_face_used_ = true; in_front_face_used_ = true;
a_.OpIf(true, dxbc::Src::V( a_.OpIf(true, dxbc::Src::V1D(
uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex), uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex),
dxbc::Src::kXXXX)); dxbc::Src::kXXXX));
for (uint32_t j = 0; j < 2; ++j) { for (uint32_t j = 0; j < 2; ++j) {
@ -1012,7 +1012,7 @@ void DxbcShaderTranslator::ROV_DepthStencilTest() {
in_front_face_used_ = true; in_front_face_used_ = true;
a_.OpMovC( a_.OpMovC(
sample_temp_z_dest, sample_temp_z_dest,
dxbc::Src::V(uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex), dxbc::Src::V1D(uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex),
dxbc::Src::kXXXX), dxbc::Src::kXXXX),
LoadSystemConstant( LoadSystemConstant(
SystemConstants::Index::kEdramStencil, SystemConstants::Index::kEdramStencil,
@ -1090,9 +1090,9 @@ void DxbcShaderTranslator::ROV_DepthStencilTest() {
// Replace. // Replace.
a_.OpCase(dxbc::Src::LU(uint32_t(xenos::StencilOp::kReplace))); a_.OpCase(dxbc::Src::LU(uint32_t(xenos::StencilOp::kReplace)));
in_front_face_used_ = true; in_front_face_used_ = true;
a_.OpMovC( a_.OpMovC(sample_temp_y_dest,
sample_temp_y_dest, dxbc::Src::V1D(
dxbc::Src::V(uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex), uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex),
dxbc::Src::kXXXX), dxbc::Src::kXXXX),
LoadSystemConstant( LoadSystemConstant(
SystemConstants::Index::kEdramStencil, SystemConstants::Index::kEdramStencil,
@ -1155,7 +1155,7 @@ void DxbcShaderTranslator::ROV_DepthStencilTest() {
in_front_face_used_ = true; in_front_face_used_ = true;
a_.OpMovC( a_.OpMovC(
sample_temp_z_dest, sample_temp_z_dest,
dxbc::Src::V(uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex), dxbc::Src::V1D(uint32_t(InOutRegister::kPSInFrontFaceAndSampleIndex),
dxbc::Src::kXXXX), dxbc::Src::kXXXX),
LoadSystemConstant( LoadSystemConstant(
SystemConstants::Index::kEdramStencil, SystemConstants::Index::kEdramStencil,
@ -1924,9 +1924,9 @@ void DxbcShaderTranslator::CompletePixelShader_DSV_DepthTo24Bit() {
// assumption of it being clamped while working with the bit representation. // assumption of it being clamped while working with the bit representation.
temp = PushSystemTemp(); temp = PushSystemTemp();
in_position_used_ |= 0b0100; in_position_used_ |= 0b0100;
a_.OpMul( a_.OpMul(dxbc::Dest::R(temp, 0b0001),
dxbc::Dest::R(temp, 0b0001), dxbc::Src::V1D(uint32_t(InOutRegister::kPSInPosition),
dxbc::Src::V(uint32_t(InOutRegister::kPSInPosition), dxbc::Src::kZZZZ), dxbc::Src::kZZZZ),
dxbc::Src::LF(2.0f), true); dxbc::Src::LF(2.0f), true);
} }
@ -2068,7 +2068,7 @@ void DxbcShaderTranslator::CompletePixelShader_AlphaToMask() {
// temp.x = alpha to coverage offset as float 0.0...3.0. // temp.x = alpha to coverage offset as float 0.0...3.0.
in_position_used_ |= 0b0011; in_position_used_ |= 0b0011;
a_.OpFToU(dxbc::Dest::R(temp, 0b0011), a_.OpFToU(dxbc::Dest::R(temp, 0b0011),
dxbc::Src::V(uint32_t(InOutRegister::kPSInPosition))); dxbc::Src::V1D(uint32_t(InOutRegister::kPSInPosition)));
a_.OpAnd(dxbc::Dest::R(temp, 0b0010), dxbc::Src::R(temp, dxbc::Src::kYYYY), a_.OpAnd(dxbc::Dest::R(temp, 0b0010), dxbc::Src::R(temp, dxbc::Src::kYYYY),
dxbc::Src::LU(1)); dxbc::Src::LU(1));
a_.OpBFI(temp_x_dest, dxbc::Src::LU(1), dxbc::Src::LU(1), temp_x_src, a_.OpBFI(temp_x_dest, dxbc::Src::LU(1), dxbc::Src::LU(1), temp_x_src,