[D3D12] Use 3/4 of logical cores for pipeline creation, cleanup pipeline log messages
This commit is contained in:
parent
890228b6f3
commit
1523a1f662
|
@ -29,6 +29,12 @@
|
||||||
|
|
||||||
DEFINE_bool(d3d12_dxbc_disasm, false,
|
DEFINE_bool(d3d12_dxbc_disasm, false,
|
||||||
"Disassemble DXBC shaders after generation.");
|
"Disassemble DXBC shaders after generation.");
|
||||||
|
DEFINE_int32(
|
||||||
|
d3d12_pipeline_creation_threads, -1,
|
||||||
|
"Number of threads used for graphics pipeline state creation. -1 to "
|
||||||
|
"calculate automatically (75% of logical CPU cores), 1-16 to specify the "
|
||||||
|
"number of threads explicitly, 0 to disable multithreaded pipeline state "
|
||||||
|
"creation.");
|
||||||
DEFINE_bool(
|
DEFINE_bool(
|
||||||
d3d12_tessellation_adaptive, false,
|
d3d12_tessellation_adaptive, false,
|
||||||
"Allow games to use adaptive tessellation - may be disabled if the game "
|
"Allow games to use adaptive tessellation - may be disabled if the game "
|
||||||
|
@ -68,17 +74,25 @@ PipelineCache::PipelineCache(D3D12CommandProcessor* command_processor,
|
||||||
depth_only_pixel_shader_ =
|
depth_only_pixel_shader_ =
|
||||||
std::move(shader_translator_->CreateDepthOnlyPixelShader());
|
std::move(shader_translator_->CreateDepthOnlyPixelShader());
|
||||||
}
|
}
|
||||||
|
|
||||||
creation_completion_event_ =
|
|
||||||
xe::threading::Event::CreateManualResetEvent(true);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
PipelineCache::~PipelineCache() { Shutdown(); }
|
PipelineCache::~PipelineCache() { Shutdown(); }
|
||||||
|
|
||||||
bool PipelineCache::Initialize() {
|
bool PipelineCache::Initialize() {
|
||||||
|
if (FLAGS_d3d12_pipeline_creation_threads != 0) {
|
||||||
creation_threads_busy_ = 0;
|
creation_threads_busy_ = 0;
|
||||||
|
creation_completion_event_ =
|
||||||
|
xe::threading::Event::CreateManualResetEvent(true);
|
||||||
creation_completion_set_event_ = false;
|
creation_completion_set_event_ = false;
|
||||||
creation_threads_shutdown_ = false;
|
creation_threads_shutdown_ = false;
|
||||||
|
uint32_t creation_thread_count;
|
||||||
|
if (FLAGS_d3d12_pipeline_creation_threads < 0) {
|
||||||
|
creation_thread_count = std::max(
|
||||||
|
xe::threading::logical_processor_count() * 3 / 4, uint32_t(1));
|
||||||
|
} else {
|
||||||
|
creation_thread_count = uint32_t(FLAGS_d3d12_pipeline_creation_threads);
|
||||||
|
}
|
||||||
|
creation_thread_count = std::min(creation_thread_count, uint32_t(16));
|
||||||
// TODO(Triang3l): Change the thread count to something non-fixed (3 is just
|
// TODO(Triang3l): Change the thread count to something non-fixed (3 is just
|
||||||
// for testing).
|
// for testing).
|
||||||
for (uint32_t i = 0; i < 3; ++i) {
|
for (uint32_t i = 0; i < 3; ++i) {
|
||||||
|
@ -87,6 +101,7 @@ bool PipelineCache::Initialize() {
|
||||||
creation_thread->set_name("D3D12 Pipelines");
|
creation_thread->set_name("D3D12 Pipelines");
|
||||||
creation_threads_.push_back(std::move(creation_thread));
|
creation_threads_.push_back(std::move(creation_thread));
|
||||||
}
|
}
|
||||||
|
}
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -94,6 +109,7 @@ void PipelineCache::Shutdown() {
|
||||||
ClearCache();
|
ClearCache();
|
||||||
|
|
||||||
// Shut down all threads.
|
// Shut down all threads.
|
||||||
|
if (!creation_threads_.empty()) {
|
||||||
{
|
{
|
||||||
std::lock_guard<std::mutex> lock(creation_request_lock_);
|
std::lock_guard<std::mutex> lock(creation_request_lock_);
|
||||||
creation_threads_shutdown_ = true;
|
creation_threads_shutdown_ = true;
|
||||||
|
@ -103,12 +119,15 @@ void PipelineCache::Shutdown() {
|
||||||
xe::threading::Wait(creation_threads_[i].get(), false);
|
xe::threading::Wait(creation_threads_[i].get(), false);
|
||||||
}
|
}
|
||||||
creation_threads_.clear();
|
creation_threads_.clear();
|
||||||
|
creation_completion_event_.reset();
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void PipelineCache::ClearCache() {
|
void PipelineCache::ClearCache() {
|
||||||
// Remove references to the current pipeline.
|
// Remove references to the current pipeline.
|
||||||
current_pipeline_ = nullptr;
|
current_pipeline_ = nullptr;
|
||||||
|
|
||||||
|
if (!creation_threads_.empty()) {
|
||||||
// Empty the pipeline creation queue.
|
// Empty the pipeline creation queue.
|
||||||
{
|
{
|
||||||
std::lock_guard<std::mutex> lock(creation_request_lock_);
|
std::lock_guard<std::mutex> lock(creation_request_lock_);
|
||||||
|
@ -116,6 +135,7 @@ void PipelineCache::ClearCache() {
|
||||||
creation_completion_set_event_ = true;
|
creation_completion_set_event_ = true;
|
||||||
}
|
}
|
||||||
creation_request_cond_.notify_one();
|
creation_request_cond_.notify_one();
|
||||||
|
}
|
||||||
|
|
||||||
// Destroy all pipelines.
|
// Destroy all pipelines.
|
||||||
for (auto it : pipelines_) {
|
for (auto it : pipelines_) {
|
||||||
|
@ -133,6 +153,7 @@ void PipelineCache::ClearCache() {
|
||||||
}
|
}
|
||||||
|
|
||||||
void PipelineCache::EndFrame() {
|
void PipelineCache::EndFrame() {
|
||||||
|
if (!creation_threads_.empty()) {
|
||||||
// Await creation of all queued pipelines.
|
// Await creation of all queued pipelines.
|
||||||
bool await_event = false;
|
bool await_event = false;
|
||||||
{
|
{
|
||||||
|
@ -147,6 +168,7 @@ void PipelineCache::EndFrame() {
|
||||||
xe::threading::Wait(creation_completion_event_.get(), false);
|
xe::threading::Wait(creation_completion_event_.get(), false);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
D3D12Shader* PipelineCache::LoadShader(ShaderType shader_type,
|
D3D12Shader* PipelineCache::LoadShader(ShaderType shader_type,
|
||||||
uint32_t guest_address,
|
uint32_t guest_address,
|
||||||
|
@ -237,7 +259,6 @@ bool PipelineCache::ConfigurePipeline(
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
#if 1
|
|
||||||
if (!EnsureShadersTranslated(vertex_shader, pixel_shader, primitive_type)) {
|
if (!EnsureShadersTranslated(vertex_shader, pixel_shader, primitive_type)) {
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
@ -248,37 +269,16 @@ bool PipelineCache::ConfigurePipeline(
|
||||||
pipelines_.insert(std::make_pair(hash, new_pipeline));
|
pipelines_.insert(std::make_pair(hash, new_pipeline));
|
||||||
COUNT_profile_set("gpu/pipeline_cache/pipelines", pipelines_.size());
|
COUNT_profile_set("gpu/pipeline_cache/pipelines", pipelines_.size());
|
||||||
|
|
||||||
|
if (!creation_threads_.empty()) {
|
||||||
// Submit the pipeline for creation to any available thread.
|
// Submit the pipeline for creation to any available thread.
|
||||||
{
|
{
|
||||||
std::lock_guard<std::mutex> lock(creation_request_lock_);
|
std::lock_guard<std::mutex> lock(creation_request_lock_);
|
||||||
creation_queue_.push_back(new_pipeline);
|
creation_queue_.push_back(new_pipeline);
|
||||||
}
|
}
|
||||||
creation_request_cond_.notify_one();
|
creation_request_cond_.notify_one();
|
||||||
#else
|
|
||||||
// Create a new pipeline if not found and add it to the cache.
|
|
||||||
if (pixel_shader != nullptr) {
|
|
||||||
XELOGGPU("Creating pipeline %.16" PRIX64 ", VS %.16" PRIX64
|
|
||||||
", PS %.16" PRIX64,
|
|
||||||
hash, vertex_shader->ucode_data_hash(),
|
|
||||||
pixel_shader->ucode_data_hash());
|
|
||||||
} else {
|
} else {
|
||||||
XELOGGPU("Creating pipeline %.16" PRIX64 ", VS %.16" PRIX64, hash,
|
new_pipeline->state = CreatePipelineState(description);
|
||||||
vertex_shader->ucode_data_hash());
|
|
||||||
}
|
}
|
||||||
if (!EnsureShadersTranslated(vertex_shader, pixel_shader, primitive_type)) {
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
ID3D12PipelineState* new_state = CreatePipelineState(description);
|
|
||||||
if (!new_state) {
|
|
||||||
XELOGE("Failed to create pipeline %.16" PRIX64, hash);
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
Pipeline* new_pipeline = new Pipeline;
|
|
||||||
new_pipeline->state = new_state;
|
|
||||||
std::memcpy(&new_pipeline->description, &description, sizeof(description));
|
|
||||||
pipelines_.insert(std::make_pair(hash, new_pipeline));
|
|
||||||
COUNT_profile_set("gpu/pipeline_cache/pipelines", pipelines_.size());
|
|
||||||
#endif
|
|
||||||
|
|
||||||
current_pipeline_ = new_pipeline;
|
current_pipeline_ = new_pipeline;
|
||||||
*pipeline_handle_out = new_pipeline;
|
*pipeline_handle_out = new_pipeline;
|
||||||
|
@ -712,6 +712,16 @@ bool PipelineCache::GetCurrentStateDescription(
|
||||||
|
|
||||||
ID3D12PipelineState* PipelineCache::CreatePipelineState(
|
ID3D12PipelineState* PipelineCache::CreatePipelineState(
|
||||||
const PipelineDescription& description) {
|
const PipelineDescription& description) {
|
||||||
|
if (description.pixel_shader != nullptr) {
|
||||||
|
XELOGE("Creating graphics pipeline state with VS %.16" PRIX64
|
||||||
|
", PS %.16" PRIX64,
|
||||||
|
description.vertex_shader->ucode_data_hash(),
|
||||||
|
description.pixel_shader->ucode_data_hash());
|
||||||
|
} else {
|
||||||
|
XELOGE("Creating graphics pipeline state with VS %.16" PRIX64,
|
||||||
|
description.vertex_shader->ucode_data_hash());
|
||||||
|
}
|
||||||
|
|
||||||
D3D12_GRAPHICS_PIPELINE_STATE_DESC state_desc;
|
D3D12_GRAPHICS_PIPELINE_STATE_DESC state_desc;
|
||||||
std::memset(&state_desc, 0, sizeof(state_desc));
|
std::memset(&state_desc, 0, sizeof(state_desc));
|
||||||
|
|
||||||
|
@ -733,6 +743,12 @@ ID3D12PipelineState* PipelineCache::CreatePipelineState(
|
||||||
}
|
}
|
||||||
|
|
||||||
// Vertex or hull/domain shaders.
|
// Vertex or hull/domain shaders.
|
||||||
|
if (!description.vertex_shader->is_translated()) {
|
||||||
|
XELOGE("Vertex shader %.16" PRIX64 " not translated",
|
||||||
|
description.vertex_shader->ucode_data_hash());
|
||||||
|
assert_always();
|
||||||
|
return nullptr;
|
||||||
|
}
|
||||||
if (description.tessellation_mode != PipelineTessellationMode::kNone) {
|
if (description.tessellation_mode != PipelineTessellationMode::kNone) {
|
||||||
switch (description.patch_type) {
|
switch (description.patch_type) {
|
||||||
case PipelinePatchType::kTriangle:
|
case PipelinePatchType::kTriangle:
|
||||||
|
@ -740,9 +756,8 @@ ID3D12PipelineState* PipelineCache::CreatePipelineState(
|
||||||
PrimitiveType::kTrianglePatch) {
|
PrimitiveType::kTrianglePatch) {
|
||||||
XELOGE(
|
XELOGE(
|
||||||
"Tried to use vertex shader %.16" PRIX64
|
"Tried to use vertex shader %.16" PRIX64
|
||||||
" for triangle patch "
|
" for triangle patch tessellation, but it's not a tessellation "
|
||||||
"tessellation, but it's not a tessellation domain shader or has "
|
"domain shader or has the wrong domain",
|
||||||
"the wrong domain",
|
|
||||||
description.vertex_shader->ucode_data_hash());
|
description.vertex_shader->ucode_data_hash());
|
||||||
assert_always();
|
assert_always();
|
||||||
return nullptr;
|
return nullptr;
|
||||||
|
@ -765,11 +780,9 @@ ID3D12PipelineState* PipelineCache::CreatePipelineState(
|
||||||
case PipelinePatchType::kQuad:
|
case PipelinePatchType::kQuad:
|
||||||
if (description.vertex_shader->GetDomainShaderPrimitiveType() !=
|
if (description.vertex_shader->GetDomainShaderPrimitiveType() !=
|
||||||
PrimitiveType::kQuadPatch) {
|
PrimitiveType::kQuadPatch) {
|
||||||
XELOGE(
|
XELOGE("Tried to use vertex shader %.16" PRIX64
|
||||||
"Tried to use vertex shader %.16" PRIX64
|
" for quad patch tessellation, but it's not a tessellation "
|
||||||
" for quad patch "
|
"domain shader or has the wrong domain",
|
||||||
"tessellation, but it's not a tessellation domain shader or has "
|
|
||||||
"the wrong domain",
|
|
||||||
description.vertex_shader->ucode_data_hash());
|
description.vertex_shader->ucode_data_hash());
|
||||||
assert_always();
|
assert_always();
|
||||||
return nullptr;
|
return nullptr;
|
||||||
|
@ -849,6 +862,12 @@ ID3D12PipelineState* PipelineCache::CreatePipelineState(
|
||||||
|
|
||||||
// Pixel shader.
|
// Pixel shader.
|
||||||
if (description.pixel_shader != nullptr) {
|
if (description.pixel_shader != nullptr) {
|
||||||
|
if (!description.pixel_shader->is_translated()) {
|
||||||
|
XELOGE("Pixel shader %.16" PRIX64 " not translated",
|
||||||
|
description.pixel_shader->ucode_data_hash());
|
||||||
|
assert_always();
|
||||||
|
return nullptr;
|
||||||
|
}
|
||||||
state_desc.PS.pShaderBytecode =
|
state_desc.PS.pShaderBytecode =
|
||||||
description.pixel_shader->translated_binary().data();
|
description.pixel_shader->translated_binary().data();
|
||||||
state_desc.PS.BytecodeLength =
|
state_desc.PS.BytecodeLength =
|
||||||
|
@ -1000,6 +1019,15 @@ ID3D12PipelineState* PipelineCache::CreatePipelineState(
|
||||||
ID3D12PipelineState* state;
|
ID3D12PipelineState* state;
|
||||||
if (FAILED(device->CreateGraphicsPipelineState(&state_desc,
|
if (FAILED(device->CreateGraphicsPipelineState(&state_desc,
|
||||||
IID_PPV_ARGS(&state)))) {
|
IID_PPV_ARGS(&state)))) {
|
||||||
|
if (description.pixel_shader != nullptr) {
|
||||||
|
XELOGE("Failed to create graphics pipeline state with VS %.16" PRIX64
|
||||||
|
", PS %.16" PRIX64,
|
||||||
|
description.vertex_shader->ucode_data_hash(),
|
||||||
|
description.pixel_shader->ucode_data_hash());
|
||||||
|
} else {
|
||||||
|
XELOGE("Failed to create graphics pipeline state with VS %.16" PRIX64,
|
||||||
|
description.vertex_shader->ucode_data_hash());
|
||||||
|
}
|
||||||
return nullptr;
|
return nullptr;
|
||||||
}
|
}
|
||||||
std::wstring name;
|
std::wstring name;
|
||||||
|
|
|
@ -223,7 +223,7 @@ class PipelineCache {
|
||||||
// Manual-reset event set when the last queued pipeline is created and there
|
// Manual-reset event set when the last queued pipeline is created and there
|
||||||
// are no more pipelines to create. This is triggered by the thread creating
|
// are no more pipelines to create. This is triggered by the thread creating
|
||||||
// the last pipeline.
|
// the last pipeline.
|
||||||
std::unique_ptr<xe::threading::Event> creation_completion_event_;
|
std::unique_ptr<xe::threading::Event> creation_completion_event_ = nullptr;
|
||||||
// Whether setting the event on completion is queued. Protected with
|
// Whether setting the event on completion is queued. Protected with
|
||||||
// creation_request_lock_, notify_one creation_request_cond_ when set.
|
// creation_request_lock_, notify_one creation_request_cond_ when set.
|
||||||
bool creation_completion_set_event_ = false;
|
bool creation_completion_set_event_ = false;
|
||||||
|
|
Loading…
Reference in New Issue