Merge branch 'master' into vulkan
This commit is contained in:
commit
90432cd004
|
@ -1822,13 +1822,13 @@ bool D3D12CommandProcessor::IssueDraw(xenos::PrimitiveType primitive_type,
|
||||||
uint32_t index_count,
|
uint32_t index_count,
|
||||||
IndexBufferInfo* index_buffer_info,
|
IndexBufferInfo* index_buffer_info,
|
||||||
bool major_mode_explicit) {
|
bool major_mode_explicit) {
|
||||||
auto device = GetD3D12Context().GetD3D12Provider().GetDevice();
|
|
||||||
auto& regs = *register_file_;
|
|
||||||
|
|
||||||
#if XE_UI_D3D12_FINE_GRAINED_DRAW_SCOPES
|
#if XE_UI_D3D12_FINE_GRAINED_DRAW_SCOPES
|
||||||
SCOPE_profile_cpu_f("gpu");
|
SCOPE_profile_cpu_f("gpu");
|
||||||
#endif // XE_UI_D3D12_FINE_GRAINED_DRAW_SCOPES
|
#endif // XE_UI_D3D12_FINE_GRAINED_DRAW_SCOPES
|
||||||
|
|
||||||
|
ID3D12Device* device = GetD3D12Context().GetD3D12Provider().GetDevice();
|
||||||
|
const RegisterFile& regs = *register_file_;
|
||||||
|
|
||||||
xenos::ModeControl edram_mode = regs.Get<reg::RB_MODECONTROL>().edram_mode;
|
xenos::ModeControl edram_mode = regs.Get<reg::RB_MODECONTROL>().edram_mode;
|
||||||
if (edram_mode == xenos::ModeControl::kCopy) {
|
if (edram_mode == xenos::ModeControl::kCopy) {
|
||||||
// Special copy handling.
|
// Special copy handling.
|
||||||
|
@ -3241,9 +3241,10 @@ void D3D12CommandProcessor::UpdateSystemConstantValues(
|
||||||
poly_offset_back_offset = poly_offset_front_offset;
|
poly_offset_back_offset = poly_offset_front_offset;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
// "slope computed in subpixels ([...] 1/16)" - R5xx Acceleration.
|
float poly_offset_scale_factor =
|
||||||
poly_offset_front_scale *= (1.0f / 16.0f) * resolution_scale;
|
xenos::kPolygonOffsetScaleSubpixelUnit * resolution_scale;
|
||||||
poly_offset_back_scale *= (1.0f / 16.0f) * resolution_scale;
|
poly_offset_front_scale *= poly_offset_scale_factor;
|
||||||
|
poly_offset_back_scale *= poly_offset_scale_factor;
|
||||||
dirty |= system_constants_.edram_poly_offset_front_scale !=
|
dirty |= system_constants_.edram_poly_offset_front_scale !=
|
||||||
poly_offset_front_scale;
|
poly_offset_front_scale;
|
||||||
system_constants_.edram_poly_offset_front_scale = poly_offset_front_scale;
|
system_constants_.edram_poly_offset_front_scale = poly_offset_front_scale;
|
||||||
|
|
|
@ -36,6 +36,7 @@
|
||||||
#include "xenia/gpu/d3d12/d3d12_render_target_cache.h"
|
#include "xenia/gpu/d3d12/d3d12_render_target_cache.h"
|
||||||
#include "xenia/gpu/draw_util.h"
|
#include "xenia/gpu/draw_util.h"
|
||||||
#include "xenia/gpu/gpu_flags.h"
|
#include "xenia/gpu/gpu_flags.h"
|
||||||
|
#include "xenia/gpu/xenos.h"
|
||||||
#include "xenia/ui/d3d12/d3d12_util.h"
|
#include "xenia/ui/d3d12/d3d12_util.h"
|
||||||
|
|
||||||
DEFINE_bool(d3d12_dxbc_disasm, false,
|
DEFINE_bool(d3d12_dxbc_disasm, false,
|
||||||
|
@ -1340,7 +1341,6 @@ bool PipelineCache::GetCurrentStateDescription(
|
||||||
break;
|
break;
|
||||||
case xenos::PrimitiveType::kLineList:
|
case xenos::PrimitiveType::kLineList:
|
||||||
case xenos::PrimitiveType::kLineStrip:
|
case xenos::PrimitiveType::kLineStrip:
|
||||||
case xenos::PrimitiveType::kLineLoop:
|
|
||||||
// Quads are emulated as line lists with adjacency.
|
// Quads are emulated as line lists with adjacency.
|
||||||
case xenos::PrimitiveType::kQuadList:
|
case xenos::PrimitiveType::kQuadList:
|
||||||
case xenos::PrimitiveType::k2DLineStrip:
|
case xenos::PrimitiveType::k2DLineStrip:
|
||||||
|
@ -1457,7 +1457,7 @@ bool PipelineCache::GetCurrentStateDescription(
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
if (!edram_rov_used) {
|
if (!edram_rov_used) {
|
||||||
float poly_offset_host_scale = draw_util::GetD3D10PolygonOffsetScale(
|
float poly_offset_host_scale = draw_util::GetD3D10PolygonOffsetFactor(
|
||||||
regs.Get<reg::RB_DEPTH_INFO>().depth_format, true);
|
regs.Get<reg::RB_DEPTH_INFO>().depth_format, true);
|
||||||
// Using ceil here just in case a game wants the offset but passes a value
|
// Using ceil here just in case a game wants the offset but passes a value
|
||||||
// that is too small - it's better to apply more offset than to make depth
|
// that is too small - it's better to apply more offset than to make depth
|
||||||
|
@ -1468,7 +1468,7 @@ bool PipelineCache::GetCurrentStateDescription(
|
||||||
(poly_offset < 0.0f ? -1 : 1);
|
(poly_offset < 0.0f ? -1 : 1);
|
||||||
// "slope computed in subpixels ([...] 1/16)" - R5xx Acceleration.
|
// "slope computed in subpixels ([...] 1/16)" - R5xx Acceleration.
|
||||||
description_out.depth_bias_slope_scaled =
|
description_out.depth_bias_slope_scaled =
|
||||||
poly_offset_scale * (1.0f / 16.0f);
|
poly_offset_scale * xenos::kPolygonOffsetScaleSubpixelUnit;
|
||||||
}
|
}
|
||||||
if (tessellated && cvars::d3d12_tessellation_wireframe) {
|
if (tessellated && cvars::d3d12_tessellation_wireframe) {
|
||||||
description_out.fill_mode_wireframe = 1;
|
description_out.fill_mode_wireframe = 1;
|
||||||
|
|
|
@ -106,7 +106,7 @@ inline reg::RB_DEPTHCONTROL GetDepthControlForCurrentEdramMode(
|
||||||
return regs.Get<reg::RB_DEPTHCONTROL>();
|
return regs.Get<reg::RB_DEPTHCONTROL>();
|
||||||
}
|
}
|
||||||
|
|
||||||
constexpr float GetD3D10PolygonOffsetScale(
|
constexpr float GetD3D10PolygonOffsetFactor(
|
||||||
xenos::DepthRenderTargetFormat depth_format, bool float24_as_0_to_0_5) {
|
xenos::DepthRenderTargetFormat depth_format, bool float24_as_0_to_0_5) {
|
||||||
if (depth_format == xenos::DepthRenderTargetFormat::kD24S8) {
|
if (depth_format == xenos::DepthRenderTargetFormat::kD24S8) {
|
||||||
return float(1 << 24);
|
return float(1 << 24);
|
||||||
|
|
|
@ -458,6 +458,15 @@ bool PrimitiveProcessor::Process(ProcessingResult& result_out) {
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
if (regs.Get<reg::PA_SU_SC_MODE_CNTL>().multi_prim_ib_ena) {
|
if (regs.Get<reg::PA_SU_SC_MODE_CNTL>().multi_prim_ib_ena) {
|
||||||
|
switch (guest_primitive_type) {
|
||||||
|
case xenos::PrimitiveType::kLineStrip:
|
||||||
|
case xenos::PrimitiveType::kTriangleFan:
|
||||||
|
case xenos::PrimitiveType::kTriangleStrip:
|
||||||
|
case xenos::PrimitiveType::kLineLoop:
|
||||||
|
case xenos::PrimitiveType::kQuadStrip:
|
||||||
|
case xenos::PrimitiveType::kPolygon:
|
||||||
|
case xenos::PrimitiveType::k2DLineStrip:
|
||||||
|
case xenos::PrimitiveType::k2DTriStrip:
|
||||||
guest_primitive_reset_index_guest_endian = xenos::GpuSwap(
|
guest_primitive_reset_index_guest_endian = xenos::GpuSwap(
|
||||||
regs.Get<reg::VGT_MULTI_PRIM_IB_RESET_INDX>().reset_indx,
|
regs.Get<reg::VGT_MULTI_PRIM_IB_RESET_INDX>().reset_indx,
|
||||||
guest_index_endian);
|
guest_index_endian);
|
||||||
|
@ -468,6 +477,15 @@ bool PrimitiveProcessor::Process(ProcessingResult& result_out) {
|
||||||
guest_index_format == xenos::IndexFormat::kInt16
|
guest_index_format == xenos::IndexFormat::kInt16
|
||||||
? guest_primitive_reset_index_guest_endian <= UINT16_MAX
|
? guest_primitive_reset_index_guest_endian <= UINT16_MAX
|
||||||
: true;
|
: true;
|
||||||
|
break;
|
||||||
|
default:
|
||||||
|
// Vulkan explicitly disallows primitive restart index for "list"
|
||||||
|
// topologies. In Direct3D 12, it's valid for non-strips, but has
|
||||||
|
// implementation-defined behavior. Make backend usage simpler by
|
||||||
|
// explicitly filtering lists out, and hope the guest never uses
|
||||||
|
// primitive reset for lists.
|
||||||
|
break;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -138,7 +138,8 @@ class PrimitiveProcessor {
|
||||||
xenos::IndexFormat host_index_format;
|
xenos::IndexFormat host_index_format;
|
||||||
xenos::Endian host_index_endian;
|
xenos::Endian host_index_endian;
|
||||||
// The reset index, if enabled, is always 0xFFFF for host_index_format
|
// The reset index, if enabled, is always 0xFFFF for host_index_format
|
||||||
// kInt16 and 0xFFFFFFFF for kInt32.
|
// kInt16 and 0xFFFFFFFF for kInt32. Never enabled for "list" primitive
|
||||||
|
// types, thus safe for direct usage on Vulkan.
|
||||||
bool host_primitive_reset_enabled;
|
bool host_primitive_reset_enabled;
|
||||||
// Backend-specific handle for the index buffer valid for the current draw,
|
// Backend-specific handle for the index buffer valid for the current draw,
|
||||||
// only valid for index_buffer_type kHostConverted and kHostBuiltin.
|
// only valid for index_buffer_type kHostConverted and kHostBuiltin.
|
||||||
|
|
|
@ -347,6 +347,16 @@ constexpr float UNorm24To32(uint32_t n24) {
|
||||||
return float(n24 + (n24 >> 23)) * (1.0f / float(1 << 24));
|
return float(n24 + (n24 >> 23)) * (1.0f / float(1 << 24));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Scale for conversion of slope scales from PA_SU_POLY_OFFSET_FRONT/BACK_SCALE
|
||||||
|
// units to those used when the slope is computed from the difference between
|
||||||
|
// adjacent pixels, for conversion from the guest to common host APIs or to
|
||||||
|
// calculation using max(|ddx(z)|, |ddy(z)|).
|
||||||
|
// "slope computed in subpixels (1/12 or 1/16)" - R5xx Acceleration.
|
||||||
|
// But the correct scale for conversion of the slope scale from subpixels to
|
||||||
|
// pixels is likely 1/16 according to:
|
||||||
|
// https://github.com/mesa3d/mesa/blob/54ad9b444c8e73da498211870e785239ad3ff1aa/src/gallium/drivers/radeonsi/si_state.c#L946
|
||||||
|
constexpr float kPolygonOffsetScaleSubpixelUnit = 1.0f / 16.0f;
|
||||||
|
|
||||||
constexpr uint32_t kColorRenderTargetFormatBits = 4;
|
constexpr uint32_t kColorRenderTargetFormatBits = 4;
|
||||||
constexpr uint32_t kDepthRenderTargetFormatBits = 1;
|
constexpr uint32_t kDepthRenderTargetFormatBits = 1;
|
||||||
constexpr uint32_t kRenderTargetFormatBits =
|
constexpr uint32_t kRenderTargetFormatBits =
|
||||||
|
|
Loading…
Reference in New Issue