[D3D12] Persistent shader and PSO storage
This commit is contained in:
parent
b1d3fd2ad3
commit
cde092ece1
|
@ -245,8 +245,8 @@ bool EmulatorWindow::Initialize() {
|
||||||
}
|
}
|
||||||
gpu_menu->AddChild(MenuItem::Create(MenuItem::Type::kSeparator));
|
gpu_menu->AddChild(MenuItem::Create(MenuItem::Type::kSeparator));
|
||||||
{
|
{
|
||||||
gpu_menu->AddChild(
|
gpu_menu->AddChild(MenuItem::Create(
|
||||||
MenuItem::Create(MenuItem::Type::kString, L"&Clear Caches", L"F5",
|
MenuItem::Type::kString, L"&Clear Runtime Caches", L"F5",
|
||||||
std::bind(&EmulatorWindow::GpuClearCaches, this)));
|
std::bind(&EmulatorWindow::GpuClearCaches, this)));
|
||||||
}
|
}
|
||||||
main_menu->AddChild(std::move(gpu_menu));
|
main_menu->AddChild(std::move(gpu_menu));
|
||||||
|
@ -454,8 +454,20 @@ void EmulatorWindow::UpdateTitle() {
|
||||||
title += xe::format_string(L" (@%.2fx)", Clock::guest_time_scalar());
|
title += xe::format_string(L" (@%.2fx)", Clock::guest_time_scalar());
|
||||||
}
|
}
|
||||||
|
|
||||||
|
if (initializing_shader_storage_) {
|
||||||
|
title += L" (Preloading shaders\u2026)";
|
||||||
|
}
|
||||||
|
|
||||||
window_->set_title(title);
|
window_->set_title(title);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
void EmulatorWindow::SetInitializingShaderStorage(bool initializing) {
|
||||||
|
if (initializing_shader_storage_ == initializing) {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
initializing_shader_storage_ = initializing;
|
||||||
|
UpdateTitle();
|
||||||
|
}
|
||||||
|
|
||||||
} // namespace app
|
} // namespace app
|
||||||
} // namespace xe
|
} // namespace xe
|
||||||
|
|
|
@ -37,6 +37,7 @@ class EmulatorWindow {
|
||||||
|
|
||||||
void UpdateTitle();
|
void UpdateTitle();
|
||||||
void ToggleFullscreen();
|
void ToggleFullscreen();
|
||||||
|
void SetInitializingShaderStorage(bool initializing);
|
||||||
|
|
||||||
private:
|
private:
|
||||||
explicit EmulatorWindow(Emulator* emulator);
|
explicit EmulatorWindow(Emulator* emulator);
|
||||||
|
@ -63,6 +64,7 @@ class EmulatorWindow {
|
||||||
std::unique_ptr<ui::Window> window_;
|
std::unique_ptr<ui::Window> window_;
|
||||||
std::wstring base_title_;
|
std::wstring base_title_;
|
||||||
uint64_t cursor_hide_time_ = 0;
|
uint64_t cursor_hide_time_ = 0;
|
||||||
|
bool initializing_shader_storage_ = false;
|
||||||
};
|
};
|
||||||
|
|
||||||
} // namespace app
|
} // namespace app
|
||||||
|
|
|
@ -243,7 +243,7 @@ int xenia_main(const std::vector<std::wstring>& args) {
|
||||||
}
|
}
|
||||||
|
|
||||||
// Create the emulator but don't initialize so we can setup the window.
|
// Create the emulator but don't initialize so we can setup the window.
|
||||||
auto emulator = std::make_unique<Emulator>(L"", content_root);
|
auto emulator = std::make_unique<Emulator>(L"", storage_root, content_root);
|
||||||
|
|
||||||
// Main emulator display window.
|
// Main emulator display window.
|
||||||
auto emulator_window = EmulatorWindow::Create(emulator.get());
|
auto emulator_window = EmulatorWindow::Create(emulator.get());
|
||||||
|
@ -331,6 +331,11 @@ int xenia_main(const std::vector<std::wstring>& args) {
|
||||||
evt->Set();
|
evt->Set();
|
||||||
});
|
});
|
||||||
|
|
||||||
|
emulator->on_shader_storage_initialization.AddListener(
|
||||||
|
[&](bool initializing) {
|
||||||
|
emulator_window->SetInitializingShaderStorage(initializing);
|
||||||
|
});
|
||||||
|
|
||||||
emulator->on_terminate.AddListener([&]() {
|
emulator->on_terminate.AddListener([&]() {
|
||||||
if (cvars::discord) {
|
if (cvars::discord) {
|
||||||
discord::DiscordPresence::NotPlaying();
|
discord::DiscordPresence::NotPlaying();
|
||||||
|
|
|
@ -58,6 +58,17 @@ bool CreateFile(const std::wstring& path);
|
||||||
// This behaves like fopen and the returned handle can be used with stdio.
|
// This behaves like fopen and the returned handle can be used with stdio.
|
||||||
FILE* OpenFile(const std::wstring& path, const char* mode);
|
FILE* OpenFile(const std::wstring& path, const char* mode);
|
||||||
|
|
||||||
|
// Wrapper for the 64-bit version of fseek, returns true on success.
|
||||||
|
bool Seek(FILE* file, int64_t offset, int origin);
|
||||||
|
|
||||||
|
// Wrapper for the 64-bit version of ftell, returns a positive value on success.
|
||||||
|
int64_t Tell(FILE* file);
|
||||||
|
|
||||||
|
// Reduces the size of a stdio file opened for writing. The file pointer is
|
||||||
|
// clamped. If this returns false, the size of the file and the file pointer are
|
||||||
|
// undefined.
|
||||||
|
bool TruncateStdioFile(FILE* file, uint64_t length);
|
||||||
|
|
||||||
// Deletes the file at the given path.
|
// Deletes the file at the given path.
|
||||||
// Returns true if the file was found and removed.
|
// Returns true if the file was found and removed.
|
||||||
bool DeleteFile(const std::wstring& path);
|
bool DeleteFile(const std::wstring& path);
|
||||||
|
|
|
@ -76,6 +76,31 @@ FILE* OpenFile(const std::wstring& path, const char* mode) {
|
||||||
return fopen(xe::to_string(fixed_path).c_str(), mode);
|
return fopen(xe::to_string(fixed_path).c_str(), mode);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool Seek(FILE* file, int64_t offset, int origin) {
|
||||||
|
return fseeko64(file, off64_t(offset), origin) == 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
int64_t Tell(FILE* file) { return int64_t(ftello64(file)); }
|
||||||
|
|
||||||
|
bool TruncateStdioFile(FILE* file, uint64_t length) {
|
||||||
|
if (fflush(file)) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
int64_t position = Tell(file);
|
||||||
|
if (position < 0) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if (ftruncate64(fileno(file), off64_t(length))) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if (uint64_t(position) > length) {
|
||||||
|
if (!Seek(file, 0, SEEK_END)) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
bool CreateFolder(const std::wstring& path) {
|
bool CreateFolder(const std::wstring& path) {
|
||||||
return mkdir(xe::to_string(path).c_str(), 0774);
|
return mkdir(xe::to_string(path).c_str(), 0774);
|
||||||
}
|
}
|
||||||
|
|
|
@ -12,6 +12,7 @@
|
||||||
|
|
||||||
#include <string>
|
#include <string>
|
||||||
|
|
||||||
|
#include <io.h>
|
||||||
#include <shlobj.h>
|
#include <shlobj.h>
|
||||||
|
|
||||||
#include "xenia/base/platform_win.h"
|
#include "xenia/base/platform_win.h"
|
||||||
|
@ -87,6 +88,32 @@ FILE* OpenFile(const std::wstring& path, const char* mode) {
|
||||||
return _wfopen(fixed_path.c_str(), xe::to_wstring(mode).c_str());
|
return _wfopen(fixed_path.c_str(), xe::to_wstring(mode).c_str());
|
||||||
}
|
}
|
||||||
|
|
||||||
|
bool Seek(FILE* file, int64_t offset, int origin) {
|
||||||
|
return _fseeki64(file, offset, origin) == 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
int64_t Tell(FILE* file) { return _ftelli64(file); }
|
||||||
|
|
||||||
|
bool TruncateStdioFile(FILE* file, uint64_t length) {
|
||||||
|
// Flush is necessary - if not flushing, stream position may be out of sync.
|
||||||
|
if (fflush(file)) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
int64_t position = Tell(file);
|
||||||
|
if (position < 0) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if (_chsize_s(_fileno(file), int64_t(length))) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
if (uint64_t(position) > length) {
|
||||||
|
if (!Seek(file, 0, SEEK_END)) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
bool DeleteFile(const std::wstring& path) {
|
bool DeleteFile(const std::wstring& path) {
|
||||||
return DeleteFileW(path.c_str()) ? true : false;
|
return DeleteFileW(path.c_str()) ? true : false;
|
||||||
}
|
}
|
||||||
|
|
|
@ -57,11 +57,13 @@ DEFINE_string(
|
||||||
namespace xe {
|
namespace xe {
|
||||||
|
|
||||||
Emulator::Emulator(const std::wstring& command_line,
|
Emulator::Emulator(const std::wstring& command_line,
|
||||||
|
const std::wstring& storage_root,
|
||||||
const std::wstring& content_root)
|
const std::wstring& content_root)
|
||||||
: on_launch(),
|
: on_launch(),
|
||||||
on_terminate(),
|
on_terminate(),
|
||||||
on_exit(),
|
on_exit(),
|
||||||
command_line_(command_line),
|
command_line_(command_line),
|
||||||
|
storage_root_(storage_root),
|
||||||
content_root_(content_root),
|
content_root_(content_root),
|
||||||
game_title_(),
|
game_title_(),
|
||||||
display_window_(nullptr),
|
display_window_(nullptr),
|
||||||
|
@ -685,11 +687,18 @@ X_STATUS Emulator::CompleteLaunch(const std::wstring& path,
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Initializing the shader storage in a blocking way so the user doesn't miss
|
||||||
|
// the initial seconds - for instance, sound from an intro video may start
|
||||||
|
// playing before the video can be seen if doing this in parallel with the
|
||||||
|
// main thread.
|
||||||
|
on_shader_storage_initialization(true);
|
||||||
|
graphics_system_->InitializeShaderStorage(storage_root_, title_id_, true);
|
||||||
|
on_shader_storage_initialization(false);
|
||||||
|
|
||||||
auto main_thread = kernel_state_->LaunchModule(module);
|
auto main_thread = kernel_state_->LaunchModule(module);
|
||||||
if (!main_thread) {
|
if (!main_thread) {
|
||||||
return X_STATUS_UNSUCCESSFUL;
|
return X_STATUS_UNSUCCESSFUL;
|
||||||
}
|
}
|
||||||
|
|
||||||
main_thread_ = main_thread;
|
main_thread_ = main_thread;
|
||||||
on_launch(title_id_, game_title_);
|
on_launch(title_id_, game_title_);
|
||||||
|
|
||||||
|
|
|
@ -48,13 +48,17 @@ namespace xe {
|
||||||
class Emulator {
|
class Emulator {
|
||||||
public:
|
public:
|
||||||
explicit Emulator(const std::wstring& command_line,
|
explicit Emulator(const std::wstring& command_line,
|
||||||
|
const std::wstring& storage_root,
|
||||||
const std::wstring& content_root);
|
const std::wstring& content_root);
|
||||||
~Emulator();
|
~Emulator();
|
||||||
|
|
||||||
// Full command line used when launching the process.
|
// Full command line used when launching the process.
|
||||||
const std::wstring& command_line() const { return command_line_; }
|
const std::wstring& command_line() const { return command_line_; }
|
||||||
|
|
||||||
// Folder content is stored in.
|
// Folder persistent internal emulator data is stored in.
|
||||||
|
const std::wstring& storage_root() const { return storage_root_; }
|
||||||
|
|
||||||
|
// Folder guest content is stored in.
|
||||||
const std::wstring& content_root() const { return content_root_; }
|
const std::wstring& content_root() const { return content_root_; }
|
||||||
|
|
||||||
// Title of the game in the default language.
|
// Title of the game in the default language.
|
||||||
|
@ -146,6 +150,7 @@ class Emulator {
|
||||||
|
|
||||||
public:
|
public:
|
||||||
xe::Delegate<uint32_t, const std::wstring&> on_launch;
|
xe::Delegate<uint32_t, const std::wstring&> on_launch;
|
||||||
|
xe::Delegate<bool> on_shader_storage_initialization;
|
||||||
xe::Delegate<> on_terminate;
|
xe::Delegate<> on_terminate;
|
||||||
xe::Delegate<> on_exit;
|
xe::Delegate<> on_exit;
|
||||||
|
|
||||||
|
@ -159,6 +164,7 @@ class Emulator {
|
||||||
const std::string& module_path);
|
const std::string& module_path);
|
||||||
|
|
||||||
std::wstring command_line_;
|
std::wstring command_line_;
|
||||||
|
std::wstring storage_root_;
|
||||||
std::wstring content_root_;
|
std::wstring content_root_;
|
||||||
|
|
||||||
std::wstring game_title_;
|
std::wstring game_title_;
|
||||||
|
|
|
@ -87,6 +87,10 @@ void CommandProcessor::Shutdown() {
|
||||||
worker_thread_.reset();
|
worker_thread_.reset();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
void CommandProcessor::InitializeShaderStorage(const std::wstring& storage_root,
|
||||||
|
uint32_t title_id,
|
||||||
|
bool blocking) {}
|
||||||
|
|
||||||
void CommandProcessor::RequestFrameTrace(const std::wstring& root_path) {
|
void CommandProcessor::RequestFrameTrace(const std::wstring& root_path) {
|
||||||
if (trace_state_ == TraceState::kStreaming) {
|
if (trace_state_ == TraceState::kStreaming) {
|
||||||
XELOGE("Streaming trace; cannot also trace frame.");
|
XELOGE("Streaming trace; cannot also trace frame.");
|
||||||
|
|
|
@ -130,6 +130,12 @@ class CommandProcessor {
|
||||||
swap_request_handler_ = fn;
|
swap_request_handler_ = fn;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// May be called not only from the command processor thread when the command
|
||||||
|
// processor is paused, and the termination of this function may be explicitly
|
||||||
|
// awaited.
|
||||||
|
virtual void InitializeShaderStorage(const std::wstring& storage_root,
|
||||||
|
uint32_t title_id, bool blocking);
|
||||||
|
|
||||||
virtual void RequestFrameTrace(const std::wstring& root_path);
|
virtual void RequestFrameTrace(const std::wstring& root_path);
|
||||||
virtual void BeginTracing(const std::wstring& root_path);
|
virtual void BeginTracing(const std::wstring& root_path);
|
||||||
virtual void EndTracing();
|
virtual void EndTracing();
|
||||||
|
|
|
@ -77,6 +77,12 @@ void D3D12CommandProcessor::ClearCaches() {
|
||||||
cache_clear_requested_ = true;
|
cache_clear_requested_ = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
void D3D12CommandProcessor::InitializeShaderStorage(
|
||||||
|
const std::wstring& storage_root, uint32_t title_id, bool blocking) {
|
||||||
|
CommandProcessor::InitializeShaderStorage(storage_root, title_id, blocking);
|
||||||
|
pipeline_cache_->InitializeShaderStorage(storage_root, title_id, blocking);
|
||||||
|
}
|
||||||
|
|
||||||
void D3D12CommandProcessor::RequestFrameTrace(const std::wstring& root_path) {
|
void D3D12CommandProcessor::RequestFrameTrace(const std::wstring& root_path) {
|
||||||
// Capture with PIX if attached.
|
// Capture with PIX if attached.
|
||||||
if (GetD3D12Context()->GetD3D12Provider()->GetGraphicsAnalysis() != nullptr) {
|
if (GetD3D12Context()->GetD3D12Provider()->GetGraphicsAnalysis() != nullptr) {
|
||||||
|
@ -2123,7 +2129,7 @@ bool D3D12CommandProcessor::EndSubmission(bool is_swap) {
|
||||||
}
|
}
|
||||||
|
|
||||||
bool D3D12CommandProcessor::CanEndSubmissionImmediately() const {
|
bool D3D12CommandProcessor::CanEndSubmissionImmediately() const {
|
||||||
return !submission_open_ || !pipeline_cache_->IsCreatingPipelines();
|
return !submission_open_ || !pipeline_cache_->IsCreatingPipelineStates();
|
||||||
}
|
}
|
||||||
|
|
||||||
void D3D12CommandProcessor::AwaitAllSubmissionsCompletion() {
|
void D3D12CommandProcessor::AwaitAllSubmissionsCompletion() {
|
||||||
|
|
|
@ -43,6 +43,9 @@ class D3D12CommandProcessor : public CommandProcessor {
|
||||||
|
|
||||||
void ClearCaches() override;
|
void ClearCaches() override;
|
||||||
|
|
||||||
|
void InitializeShaderStorage(const std::wstring& storage_root,
|
||||||
|
uint32_t title_id, bool blocking) override;
|
||||||
|
|
||||||
void RequestFrameTrace(const std::wstring& root_path) override;
|
void RequestFrameTrace(const std::wstring& root_path) override;
|
||||||
|
|
||||||
void TracePlaybackWroteMemory(uint32_t base_ptr, uint32_t length) override;
|
void TracePlaybackWroteMemory(uint32_t base_ptr, uint32_t length) override;
|
||||||
|
@ -125,10 +128,11 @@ class D3D12CommandProcessor : public CommandProcessor {
|
||||||
// render targets or copying to depth render targets.
|
// render targets or copying to depth render targets.
|
||||||
void SetSamplePositions(MsaaSamples sample_positions);
|
void SetSamplePositions(MsaaSamples sample_positions);
|
||||||
|
|
||||||
// Returns a pipeline with deferred creation by its handle. May return nullptr
|
// Returns a pipeline state object with deferred creation by its handle. May
|
||||||
// if failed to create the pipeline.
|
// return nullptr if failed to create the pipeline state object.
|
||||||
inline ID3D12PipelineState* GetPipelineStateByHandle(void* handle) const {
|
inline ID3D12PipelineState* GetD3D12PipelineStateByHandle(
|
||||||
return pipeline_cache_->GetPipelineStateByHandle(handle);
|
void* handle) const {
|
||||||
|
return pipeline_cache_->GetD3D12PipelineStateByHandle(handle);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Sets the current pipeline state to a compute pipeline. This is for cache
|
// Sets the current pipeline state to a compute pipeline. This is for cache
|
||||||
|
|
|
@ -200,7 +200,8 @@ void DeferredCommandList::Execute(ID3D12GraphicsCommandList* command_list,
|
||||||
}
|
}
|
||||||
} break;
|
} break;
|
||||||
case Command::kSetPipelineStateHandle: {
|
case Command::kSetPipelineStateHandle: {
|
||||||
current_pipeline_state = command_processor_->GetPipelineStateByHandle(
|
current_pipeline_state =
|
||||||
|
command_processor_->GetD3D12PipelineStateByHandle(
|
||||||
*reinterpret_cast<void* const*>(stream));
|
*reinterpret_cast<void* const*>(stream));
|
||||||
if (current_pipeline_state) {
|
if (current_pipeline_state) {
|
||||||
command_list->SetPipelineState(current_pipeline_state);
|
command_list->SetPipelineState(current_pipeline_state);
|
||||||
|
|
File diff suppressed because it is too large
Load Diff
|
@ -11,13 +11,17 @@
|
||||||
#define XENIA_GPU_D3D12_PIPELINE_CACHE_H_
|
#define XENIA_GPU_D3D12_PIPELINE_CACHE_H_
|
||||||
|
|
||||||
#include <condition_variable>
|
#include <condition_variable>
|
||||||
|
#include <cstdio>
|
||||||
#include <deque>
|
#include <deque>
|
||||||
#include <memory>
|
#include <memory>
|
||||||
#include <mutex>
|
#include <mutex>
|
||||||
|
#include <string>
|
||||||
#include <thread>
|
#include <thread>
|
||||||
#include <unordered_map>
|
#include <unordered_map>
|
||||||
|
#include <utility>
|
||||||
#include <vector>
|
#include <vector>
|
||||||
|
|
||||||
|
#include "xenia/base/platform.h"
|
||||||
#include "xenia/base/threading.h"
|
#include "xenia/base/threading.h"
|
||||||
#include "xenia/gpu/d3d12/d3d12_shader.h"
|
#include "xenia/gpu/d3d12/d3d12_shader.h"
|
||||||
#include "xenia/gpu/d3d12/render_target_cache.h"
|
#include "xenia/gpu/d3d12/render_target_cache.h"
|
||||||
|
@ -40,10 +44,14 @@ class PipelineCache {
|
||||||
|
|
||||||
bool Initialize();
|
bool Initialize();
|
||||||
void Shutdown();
|
void Shutdown();
|
||||||
void ClearCache();
|
void ClearCache(bool shutting_down = false);
|
||||||
|
|
||||||
|
void InitializeShaderStorage(const std::wstring& storage_root,
|
||||||
|
uint32_t title_id, bool blocking);
|
||||||
|
void ShutdownShaderStorage();
|
||||||
|
|
||||||
void EndSubmission();
|
void EndSubmission();
|
||||||
bool IsCreatingPipelines();
|
bool IsCreatingPipelineStates();
|
||||||
|
|
||||||
D3D12Shader* LoadShader(ShaderType shader_type, uint32_t guest_address,
|
D3D12Shader* LoadShader(ShaderType shader_type, uint32_t guest_address,
|
||||||
const uint32_t* host_address, uint32_t dword_count);
|
const uint32_t* host_address, uint32_t dword_count);
|
||||||
|
@ -57,15 +65,32 @@ class PipelineCache {
|
||||||
D3D12Shader* vertex_shader, D3D12Shader* pixel_shader, bool tessellated,
|
D3D12Shader* vertex_shader, D3D12Shader* pixel_shader, bool tessellated,
|
||||||
PrimitiveType primitive_type, IndexFormat index_format, bool early_z,
|
PrimitiveType primitive_type, IndexFormat index_format, bool early_z,
|
||||||
const RenderTargetCache::PipelineRenderTarget render_targets[5],
|
const RenderTargetCache::PipelineRenderTarget render_targets[5],
|
||||||
void** pipeline_handle_out, ID3D12RootSignature** root_signature_out);
|
void** pipeline_state_handle_out,
|
||||||
|
ID3D12RootSignature** root_signature_out);
|
||||||
|
|
||||||
// Returns a pipeline with deferred creation by its handle. May return nullptr
|
// Returns a pipeline state object with deferred creation by its handle. May
|
||||||
// if failed to create the pipeline.
|
// return nullptr if failed to create the pipeline state object.
|
||||||
inline ID3D12PipelineState* GetPipelineStateByHandle(void* handle) const {
|
inline ID3D12PipelineState* GetD3D12PipelineStateByHandle(
|
||||||
return reinterpret_cast<const Pipeline*>(handle)->state;
|
void* handle) const {
|
||||||
|
return reinterpret_cast<const PipelineState*>(handle)->state;
|
||||||
}
|
}
|
||||||
|
|
||||||
private:
|
private:
|
||||||
|
XEPACKEDSTRUCT(ShaderStoredHeader, {
|
||||||
|
uint64_t ucode_data_hash;
|
||||||
|
|
||||||
|
uint32_t ucode_dword_count : 16;
|
||||||
|
ShaderType type : 1;
|
||||||
|
PrimitiveType patch_primitive_type : 6;
|
||||||
|
|
||||||
|
reg::SQ_PROGRAM_CNTL sq_program_cntl;
|
||||||
|
|
||||||
|
static constexpr uint32_t kVersion = 0x20200301;
|
||||||
|
});
|
||||||
|
|
||||||
|
// Update PipelineDescription::kVersion if any of the Pipeline* enums are
|
||||||
|
// changed!
|
||||||
|
|
||||||
enum class PipelineStripCutIndex : uint32_t {
|
enum class PipelineStripCutIndex : uint32_t {
|
||||||
kNone,
|
kNone,
|
||||||
kFFFF,
|
kFFFF,
|
||||||
|
@ -122,7 +147,8 @@ class PipelineCache {
|
||||||
kSrcAlphaSat,
|
kSrcAlphaSat,
|
||||||
};
|
};
|
||||||
|
|
||||||
struct PipelineRenderTarget {
|
// Update PipelineDescription::kVersion if anything is changed!
|
||||||
|
XEPACKEDSTRUCT(PipelineRenderTarget, {
|
||||||
uint32_t used : 1; // 1
|
uint32_t used : 1; // 1
|
||||||
ColorRenderTargetFormat format : 4; // 5
|
ColorRenderTargetFormat format : 4; // 5
|
||||||
PipelineBlendFactor src_blend : 4; // 9
|
PipelineBlendFactor src_blend : 4; // 9
|
||||||
|
@ -132,12 +158,12 @@ class PipelineCache {
|
||||||
PipelineBlendFactor dest_blend_alpha : 4; // 24
|
PipelineBlendFactor dest_blend_alpha : 4; // 24
|
||||||
BlendOp blend_op_alpha : 3; // 27
|
BlendOp blend_op_alpha : 3; // 27
|
||||||
uint32_t write_mask : 4; // 31
|
uint32_t write_mask : 4; // 31
|
||||||
};
|
});
|
||||||
|
|
||||||
struct PipelineDescription {
|
XEPACKEDSTRUCT(PipelineDescription, {
|
||||||
ID3D12RootSignature* root_signature;
|
uint64_t vertex_shader_hash;
|
||||||
D3D12Shader* vertex_shader;
|
// 0 if drawing without a pixel shader.
|
||||||
D3D12Shader* pixel_shader;
|
uint64_t pixel_shader_hash;
|
||||||
|
|
||||||
int32_t depth_bias;
|
int32_t depth_bias;
|
||||||
float depth_bias_slope_scaled;
|
float depth_bias_slope_scaled;
|
||||||
|
@ -170,19 +196,34 @@ class PipelineCache {
|
||||||
CompareFunction stencil_back_func : 3; // 32
|
CompareFunction stencil_back_func : 3; // 32
|
||||||
|
|
||||||
PipelineRenderTarget render_targets[4];
|
PipelineRenderTarget render_targets[4];
|
||||||
|
|
||||||
|
static constexpr uint32_t kVersion = 0x20200309;
|
||||||
|
});
|
||||||
|
|
||||||
|
XEPACKEDSTRUCT(PipelineStoredDescription, {
|
||||||
|
uint64_t description_hash;
|
||||||
|
PipelineDescription description;
|
||||||
|
});
|
||||||
|
|
||||||
|
struct PipelineRuntimeDescription {
|
||||||
|
ID3D12RootSignature* root_signature;
|
||||||
|
D3D12Shader* vertex_shader;
|
||||||
|
D3D12Shader* pixel_shader;
|
||||||
|
PipelineDescription description;
|
||||||
};
|
};
|
||||||
|
|
||||||
bool TranslateShader(D3D12Shader* shader, reg::SQ_PROGRAM_CNTL cntl,
|
bool TranslateShader(DxbcShaderTranslator& translator, D3D12Shader* shader,
|
||||||
bool tessellated, PrimitiveType primitive_type);
|
reg::SQ_PROGRAM_CNTL cntl,
|
||||||
|
PrimitiveType patch_primitive_type);
|
||||||
|
|
||||||
bool GetCurrentStateDescription(
|
bool GetCurrentStateDescription(
|
||||||
D3D12Shader* vertex_shader, D3D12Shader* pixel_shader, bool tessellated,
|
D3D12Shader* vertex_shader, D3D12Shader* pixel_shader, bool tessellated,
|
||||||
PrimitiveType primitive_type, IndexFormat index_format, bool early_z,
|
PrimitiveType primitive_type, IndexFormat index_format, bool early_z,
|
||||||
const RenderTargetCache::PipelineRenderTarget render_targets[5],
|
const RenderTargetCache::PipelineRenderTarget render_targets[5],
|
||||||
PipelineDescription& description_out);
|
PipelineRuntimeDescription& runtime_description_out);
|
||||||
|
|
||||||
ID3D12PipelineState* CreatePipelineState(
|
ID3D12PipelineState* CreateD3D12PipelineState(
|
||||||
const PipelineDescription& description);
|
const PipelineRuntimeDescription& runtime_description);
|
||||||
|
|
||||||
D3D12CommandProcessor* command_processor_;
|
D3D12CommandProcessor* command_processor_;
|
||||||
RegisterFile* register_file_;
|
RegisterFile* register_file_;
|
||||||
|
@ -200,40 +241,71 @@ class PipelineCache {
|
||||||
// Xenos pixel shader provided.
|
// Xenos pixel shader provided.
|
||||||
std::vector<uint8_t> depth_only_pixel_shader_;
|
std::vector<uint8_t> depth_only_pixel_shader_;
|
||||||
|
|
||||||
struct Pipeline {
|
struct PipelineState {
|
||||||
// nullptr if creation has failed.
|
// nullptr if creation has failed.
|
||||||
ID3D12PipelineState* state;
|
ID3D12PipelineState* state;
|
||||||
PipelineDescription description;
|
PipelineRuntimeDescription description;
|
||||||
};
|
};
|
||||||
// All previously generated pipelines identified by hash and the description.
|
// All previously generated pipeline state objects identified by hash and the
|
||||||
std::unordered_multimap<uint64_t, Pipeline*> pipelines_;
|
// description.
|
||||||
|
std::unordered_multimap<uint64_t, PipelineState*> pipeline_states_;
|
||||||
|
|
||||||
// Previously used pipeline. This matches our current state settings
|
// Previously used pipeline state object. This matches our current state
|
||||||
// and allows us to quickly(ish) reuse the pipeline if no registers have
|
// settings and allows us to quickly(ish) reuse the pipeline state if no
|
||||||
// changed.
|
// registers have changed.
|
||||||
Pipeline* current_pipeline_ = nullptr;
|
PipelineState* current_pipeline_state_ = nullptr;
|
||||||
|
|
||||||
// Pipeline creation threads.
|
// Currently open shader storage path.
|
||||||
void CreationThread();
|
std::wstring shader_storage_root_;
|
||||||
|
uint32_t shader_storage_title_id_ = 0;
|
||||||
|
|
||||||
|
// Shader storage output stream, for preload in the next emulator runs.
|
||||||
|
FILE* shader_storage_file_ = nullptr;
|
||||||
|
bool shader_storage_file_flush_needed_ = false;
|
||||||
|
|
||||||
|
// Pipeline state storage output stream, for preload in the next emulator
|
||||||
|
// runs.
|
||||||
|
FILE* pipeline_state_storage_file_ = nullptr;
|
||||||
|
bool pipeline_state_storage_file_flush_needed_ = false;
|
||||||
|
|
||||||
|
// Thread for asynchronous writing to the storage streams.
|
||||||
|
void StorageWriteThread();
|
||||||
|
std::mutex storage_write_request_lock_;
|
||||||
|
std::condition_variable storage_write_request_cond_;
|
||||||
|
// Storage thread input is protected with storage_write_request_lock_, and the
|
||||||
|
// thread is notified about its change via storage_write_request_cond_.
|
||||||
|
std::deque<std::pair<const Shader*, reg::SQ_PROGRAM_CNTL>>
|
||||||
|
storage_write_shader_queue_;
|
||||||
|
std::deque<PipelineStoredDescription> storage_write_pipeline_state_queue_;
|
||||||
|
bool storage_write_flush_shaders_ = false;
|
||||||
|
bool storage_write_flush_pipeline_states_ = false;
|
||||||
|
bool storage_write_thread_shutdown_ = false;
|
||||||
|
std::unique_ptr<xe::threading::Thread> storage_write_thread_;
|
||||||
|
|
||||||
|
// Pipeline state object creation threads.
|
||||||
|
void CreationThread(size_t thread_index);
|
||||||
|
void CreateQueuedPipelineStatesOnProcessorThread();
|
||||||
std::mutex creation_request_lock_;
|
std::mutex creation_request_lock_;
|
||||||
std::condition_variable creation_request_cond_;
|
std::condition_variable creation_request_cond_;
|
||||||
// Protected with creation_request_lock_, notify_one creation_request_cond_
|
// Protected with creation_request_lock_, notify_one creation_request_cond_
|
||||||
// when set.
|
// when set.
|
||||||
std::deque<Pipeline*> creation_queue_;
|
std::deque<PipelineState*> creation_queue_;
|
||||||
// Number of threads that are currently creating a pipeline - incremented when
|
// Number of threads that are currently creating a pipeline state object -
|
||||||
// a pipeline is dequeued (the completion event can't be triggered before this
|
// incremented when a pipeline state object is dequeued (the completion event
|
||||||
// is zero). Protected with creation_request_lock_.
|
// can't be triggered before this is zero). Protected with
|
||||||
uint32_t creation_threads_busy_ = 0;
|
// creation_request_lock_.
|
||||||
// Manual-reset event set when the last queued pipeline is created and there
|
size_t creation_threads_busy_ = 0;
|
||||||
// are no more pipelines to create. This is triggered by the thread creating
|
// Manual-reset event set when the last queued pipeline state object is
|
||||||
// the last pipeline.
|
// created and there are no more pipeline state objects to create. This is
|
||||||
|
// triggered by the thread creating the last pipeline state object.
|
||||||
std::unique_ptr<xe::threading::Event> creation_completion_event_ = nullptr;
|
std::unique_ptr<xe::threading::Event> creation_completion_event_ = nullptr;
|
||||||
// Whether setting the event on completion is queued. Protected with
|
// Whether setting the event on completion is queued. Protected with
|
||||||
// creation_request_lock_, notify_one creation_request_cond_ when set.
|
// creation_request_lock_, notify_one creation_request_cond_ when set.
|
||||||
bool creation_completion_set_event_ = false;
|
bool creation_completion_set_event_ = false;
|
||||||
// Whether to shut down the creation threads as soon as possible. Protected
|
// Creation threads with this index or above need to be shut down as soon as
|
||||||
// with creation_request_lock_, notify_all creation_request_cond_ when set.
|
// possible. Protected with creation_request_lock_, notify_all
|
||||||
bool creation_threads_shutdown_ = false;
|
// creation_request_cond_ when set.
|
||||||
|
size_t creation_threads_shutdown_from_ = SIZE_MAX;
|
||||||
std::vector<std::unique_ptr<xe::threading::Thread>> creation_threads_;
|
std::vector<std::unique_ptr<xe::threading::Thread>> creation_threads_;
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
|
@ -13,8 +13,10 @@ DEFINE_string(trace_gpu_prefix, "scratch/gpu/",
|
||||||
"Prefix path for GPU trace files.", "GPU");
|
"Prefix path for GPU trace files.", "GPU");
|
||||||
DEFINE_bool(trace_gpu_stream, false, "Trace all GPU packets.", "GPU");
|
DEFINE_bool(trace_gpu_stream, false, "Trace all GPU packets.", "GPU");
|
||||||
|
|
||||||
DEFINE_string(dump_shaders, "",
|
DEFINE_string(
|
||||||
"Path to write GPU shaders to as they are compiled.", "GPU");
|
dump_shaders, "",
|
||||||
|
"For shader debugging, path to dump GPU shaders to as they are compiled.",
|
||||||
|
"GPU");
|
||||||
|
|
||||||
DEFINE_bool(vsync, true, "Enable VSYNC.", "GPU");
|
DEFINE_bool(vsync, true, "Enable VSYNC.", "GPU");
|
||||||
|
|
||||||
|
|
|
@ -20,6 +20,12 @@
|
||||||
#include "xenia/ui/graphics_provider.h"
|
#include "xenia/ui/graphics_provider.h"
|
||||||
#include "xenia/ui/loop.h"
|
#include "xenia/ui/loop.h"
|
||||||
|
|
||||||
|
DEFINE_bool(
|
||||||
|
store_shaders, true,
|
||||||
|
"Store shaders persistently and load them when loading games to avoid "
|
||||||
|
"runtime spikes and freezes when playing the game not for the first time.",
|
||||||
|
"GPU");
|
||||||
|
|
||||||
namespace xe {
|
namespace xe {
|
||||||
namespace gpu {
|
namespace gpu {
|
||||||
|
|
||||||
|
@ -269,6 +275,34 @@ void GraphicsSystem::ClearCaches() {
|
||||||
[&]() { command_processor_->ClearCaches(); });
|
[&]() { command_processor_->ClearCaches(); });
|
||||||
}
|
}
|
||||||
|
|
||||||
|
void GraphicsSystem::InitializeShaderStorage(const std::wstring& storage_root,
|
||||||
|
uint32_t title_id, bool blocking) {
|
||||||
|
if (!cvars::store_shaders) {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
if (blocking) {
|
||||||
|
if (command_processor_->is_paused()) {
|
||||||
|
// Safe to run on any thread while the command processor is paused, no
|
||||||
|
// race condition.
|
||||||
|
command_processor_->InitializeShaderStorage(storage_root, title_id, true);
|
||||||
|
} else {
|
||||||
|
xe::threading::Fence fence;
|
||||||
|
command_processor_->CallInThread(
|
||||||
|
[this, storage_root, title_id, &fence]() {
|
||||||
|
command_processor_->InitializeShaderStorage(storage_root, title_id,
|
||||||
|
true);
|
||||||
|
fence.Signal();
|
||||||
|
});
|
||||||
|
fence.Wait();
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
command_processor_->CallInThread([this, storage_root, title_id]() {
|
||||||
|
command_processor_->InitializeShaderStorage(storage_root, title_id,
|
||||||
|
false);
|
||||||
|
});
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
void GraphicsSystem::RequestFrameTrace() {
|
void GraphicsSystem::RequestFrameTrace() {
|
||||||
command_processor_->RequestFrameTrace(
|
command_processor_->RequestFrameTrace(
|
||||||
xe::to_wstring(cvars::trace_gpu_prefix));
|
xe::to_wstring(cvars::trace_gpu_prefix));
|
||||||
|
|
|
@ -12,6 +12,7 @@
|
||||||
|
|
||||||
#include <atomic>
|
#include <atomic>
|
||||||
#include <memory>
|
#include <memory>
|
||||||
|
#include <string>
|
||||||
#include <thread>
|
#include <thread>
|
||||||
|
|
||||||
#include "xenia/cpu/processor.h"
|
#include "xenia/cpu/processor.h"
|
||||||
|
@ -62,6 +63,9 @@ class GraphicsSystem {
|
||||||
|
|
||||||
virtual void ClearCaches();
|
virtual void ClearCaches();
|
||||||
|
|
||||||
|
void InitializeShaderStorage(const std::wstring& storage_root,
|
||||||
|
uint32_t title_id, bool blocking);
|
||||||
|
|
||||||
void RequestFrameTrace();
|
void RequestFrameTrace();
|
||||||
void BeginTracing();
|
void BeginTracing();
|
||||||
void EndTracing();
|
void EndTracing();
|
||||||
|
|
|
@ -102,7 +102,7 @@ int TraceDump::Main(const std::vector<std::wstring>& args) {
|
||||||
|
|
||||||
bool TraceDump::Setup() {
|
bool TraceDump::Setup() {
|
||||||
// Create the emulator but don't initialize so we can setup the window.
|
// Create the emulator but don't initialize so we can setup the window.
|
||||||
emulator_ = std::make_unique<Emulator>(L"", L"");
|
emulator_ = std::make_unique<Emulator>(L"", L"", L"");
|
||||||
X_STATUS result = emulator_->Setup(
|
X_STATUS result = emulator_->Setup(
|
||||||
nullptr, nullptr, [this]() { return CreateGraphicsSystem(); }, nullptr);
|
nullptr, nullptr, [this]() { return CreateGraphicsSystem(); }, nullptr);
|
||||||
if (XFAILED(result)) {
|
if (XFAILED(result)) {
|
||||||
|
|
|
@ -122,7 +122,7 @@ bool TraceViewer::Setup() {
|
||||||
window_->Resize(1920, 1200);
|
window_->Resize(1920, 1200);
|
||||||
|
|
||||||
// Create the emulator but don't initialize so we can setup the window.
|
// Create the emulator but don't initialize so we can setup the window.
|
||||||
emulator_ = std::make_unique<Emulator>(L"", L"");
|
emulator_ = std::make_unique<Emulator>(L"", L"", L"");
|
||||||
X_STATUS result = emulator_->Setup(
|
X_STATUS result = emulator_->Setup(
|
||||||
window_.get(), nullptr, [this]() { return CreateGraphicsSystem(); },
|
window_.get(), nullptr, [this]() { return CreateGraphicsSystem(); },
|
||||||
nullptr);
|
nullptr);
|
||||||
|
|
Loading…
Reference in New Issue