Merge pull request #11298 from Pokechu22/vertexloader-no-DataReader

VertexLoader: Eliminate use of DataReader
This commit is contained in:
Mai 2022-11-23 04:40:53 +00:00 committed by GitHub
commit cb232155d9
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
16 changed files with 37 additions and 70 deletions

View File

@ -127,10 +127,8 @@ public:
// load vertices // load vertices
const u32 size = vertex_size * num_vertices; const u32 size = vertex_size * num_vertices;
// HACK
DataReader src{const_cast<u8*>(vertex_data), const_cast<u8*>(vertex_data) + size};
const u32 bytes = const u32 bytes =
VertexLoaderManager::RunVertices<is_preprocess>(vat, primitive, num_vertices, src); VertexLoaderManager::RunVertices<is_preprocess>(vat, primitive, num_vertices, vertex_data);
ASSERT(bytes == size); ASSERT(bytes == size);

View File

@ -6,7 +6,6 @@
#include "Common/Assert.h" #include "Common/Assert.h"
#include "Common/CommonTypes.h" #include "Common/CommonTypes.h"
#include "VideoCommon/DataReader.h"
#include "VideoCommon/VertexLoaderManager.h" #include "VideoCommon/VertexLoaderManager.h"
#include "VideoCommon/VertexLoaderUtils.h" #include "VideoCommon/VertexLoaderUtils.h"
#include "VideoCommon/VertexLoader_Color.h" #include "VideoCommon/VertexLoader_Color.h"
@ -16,7 +15,7 @@
#include "VideoCommon/VideoCommon.h" #include "VideoCommon/VideoCommon.h"
// This pointer is used as the source/dst for all fixed function loader calls // This pointer is used as the source/dst for all fixed function loader calls
u8* g_video_buffer_read_ptr; const u8* g_video_buffer_read_ptr;
u8* g_vertex_manager_write_ptr; u8* g_vertex_manager_write_ptr;
static void PosMtx_ReadDirect_UByte(VertexLoader* loader) static void PosMtx_ReadDirect_UByte(VertexLoader* loader)
@ -222,7 +221,7 @@ void VertexLoader::CompileVertexTranslator()
WriteCall(VertexLoader_TextCoord::GetDummyFunction()); // important to get indices right! WriteCall(VertexLoader_TextCoord::GetDummyFunction()); // important to get indices right!
break; break;
} }
else if (m_VtxDesc.low.TexMatIdx[i]) else if (m_VtxDesc.low.TexMatIdx[j])
{ {
has_more = true; has_more = true;
} }
@ -249,10 +248,10 @@ void VertexLoader::WriteCall(TPipelineFunction func)
m_PipelineStages[m_numPipelineStages++] = func; m_PipelineStages[m_numPipelineStages++] = func;
} }
int VertexLoader::RunVertices(DataReader src, DataReader dst, int count) int VertexLoader::RunVertices(const u8* src, u8* dst, int count)
{ {
g_vertex_manager_write_ptr = dst.GetPointer(); g_vertex_manager_write_ptr = dst;
g_video_buffer_read_ptr = src.GetPointer(); g_video_buffer_read_ptr = src;
m_numLoadedVertices += count; m_numLoadedVertices += count;
m_skippedVertices = 0; m_skippedVertices = 0;

View File

@ -11,7 +11,6 @@
#include "Common/CommonTypes.h" #include "Common/CommonTypes.h"
#include "VideoCommon/VertexLoaderBase.h" #include "VideoCommon/VertexLoaderBase.h"
class DataReader;
class VertexLoader; class VertexLoader;
typedef void (*TPipelineFunction)(VertexLoader* loader); typedef void (*TPipelineFunction)(VertexLoader* loader);
@ -20,7 +19,7 @@ class VertexLoader : public VertexLoaderBase
public: public:
VertexLoader(const TVtxDesc& vtx_desc, const VAT& vtx_attr); VertexLoader(const TVtxDesc& vtx_desc, const VAT& vtx_attr);
int RunVertices(DataReader src, DataReader dst, int count) override; int RunVertices(const u8* src, u8* dst, int count) override;
// They are used for the communication with the loader functions // They are used for the communication with the loader functions
float m_posScale; float m_posScale;
float m_tcScale[8]; float m_tcScale[8];

View File

@ -7,7 +7,6 @@
#include "Common/CommonTypes.h" #include "Common/CommonTypes.h"
#include "VideoCommon/CPMemory.h" #include "VideoCommon/CPMemory.h"
#include "VideoCommon/DataReader.h"
#include "VideoCommon/VertexLoaderManager.h" #include "VideoCommon/VertexLoaderManager.h"
using namespace Arm64Gen; using namespace Arm64Gen;
@ -517,9 +516,8 @@ void VertexLoaderARM64::GenerateVertexLoader()
m_native_vtx_decl.stride = m_dst_ofs; m_native_vtx_decl.stride = m_dst_ofs;
} }
int VertexLoaderARM64::RunVertices(DataReader src, DataReader dst, int count) int VertexLoaderARM64::RunVertices(const u8* src, u8* dst, int count)
{ {
m_numLoadedVertices += count; m_numLoadedVertices += count;
return ((int (*)(u8 * src, u8 * dst, int count)) region)(src.GetPointer(), dst.GetPointer(), return ((int (*)(const u8* src, u8* dst, int count))region)(src, dst, count - 1);
count - 1);
} }

View File

@ -9,7 +9,6 @@
#include "Common/CommonTypes.h" #include "Common/CommonTypes.h"
#include "VideoCommon/VertexLoaderBase.h" #include "VideoCommon/VertexLoaderBase.h"
class DataReader;
enum class VertexComponentFormat; enum class VertexComponentFormat;
enum class ComponentFormat; enum class ComponentFormat;
enum class ColorFormat; enum class ColorFormat;
@ -21,7 +20,7 @@ public:
VertexLoaderARM64(const TVtxDesc& vtx_desc, const VAT& vtx_att); VertexLoaderARM64(const TVtxDesc& vtx_desc, const VAT& vtx_att);
protected: protected:
int RunVertices(DataReader src, DataReader dst, int count) override; int RunVertices(const u8* src, u8* dst, int count) override;
private: private:
u32 m_src_ofs = 0; u32 m_src_ofs = 0;

View File

@ -17,7 +17,6 @@
#include "Common/Logging/Log.h" #include "Common/Logging/Log.h"
#include "Common/MsgHandler.h" #include "Common/MsgHandler.h"
#include "VideoCommon/DataReader.h"
#include "VideoCommon/VertexLoader.h" #include "VideoCommon/VertexLoader.h"
#include "VideoCommon/VertexLoader_Color.h" #include "VideoCommon/VertexLoader_Color.h"
#include "VideoCommon/VertexLoader_Normal.h" #include "VideoCommon/VertexLoader_Normal.h"
@ -57,15 +56,13 @@ public:
b->m_vertex_size, b->m_native_components, b->m_native_vtx_decl.stride); b->m_vertex_size, b->m_native_components, b->m_native_vtx_decl.stride);
} }
} }
int RunVertices(DataReader src, DataReader dst, int count) override int RunVertices(const u8* src, u8* dst, int count) override
{ {
buffer_a.resize(count * a->m_native_vtx_decl.stride + 4); buffer_a.resize(count * a->m_native_vtx_decl.stride + 4);
buffer_b.resize(count * b->m_native_vtx_decl.stride + 4); buffer_b.resize(count * b->m_native_vtx_decl.stride + 4);
int count_a = int count_a = a->RunVertices(src, buffer_a.data(), count);
a->RunVertices(src, DataReader(buffer_a.data(), buffer_a.data() + buffer_a.size()), count); int count_b = b->RunVertices(src, buffer_b.data(), count);
int count_b =
b->RunVertices(src, DataReader(buffer_b.data(), buffer_b.data() + buffer_b.size()), count);
if (count_a != count_b) if (count_a != count_b)
{ {
@ -84,7 +81,7 @@ public:
m_VtxDesc, m_VtxAttr); m_VtxDesc, m_VtxAttr);
} }
memcpy(dst.GetPointer(), buffer_a.data(), count_a * m_native_vtx_decl.stride); memcpy(dst, buffer_a.data(), count_a * m_native_vtx_decl.stride);
m_numLoadedVertices += count; m_numLoadedVertices += count;
return count_a; return count_a;
} }
@ -162,7 +159,7 @@ std::unique_ptr<VertexLoaderBase> VertexLoaderBase::CreateVertexLoader(const TVt
{ {
std::unique_ptr<VertexLoaderBase> loader = nullptr; std::unique_ptr<VertexLoaderBase> loader = nullptr;
//#define COMPARE_VERTEXLOADERS // #define COMPARE_VERTEXLOADERS
#if defined(_M_X86_64) #if defined(_M_X86_64)
loader = std::make_unique<VertexLoaderX64>(vtx_desc, vtx_attr); loader = std::make_unique<VertexLoaderX64>(vtx_desc, vtx_attr);

View File

@ -12,8 +12,6 @@
#include "VideoCommon/CPMemory.h" #include "VideoCommon/CPMemory.h"
#include "VideoCommon/NativeVertexFormat.h" #include "VideoCommon/NativeVertexFormat.h"
class DataReader;
class VertexLoaderUID class VertexLoaderUID
{ {
std::array<u32, 5> vid{}; std::array<u32, 5> vid{};
@ -65,7 +63,7 @@ public:
static std::unique_ptr<VertexLoaderBase> CreateVertexLoader(const TVtxDesc& vtx_desc, static std::unique_ptr<VertexLoaderBase> CreateVertexLoader(const TVtxDesc& vtx_desc,
const VAT& vtx_attr); const VAT& vtx_attr);
virtual ~VertexLoaderBase() {} virtual ~VertexLoaderBase() {}
virtual int RunVertices(DataReader src, DataReader dst, int count) = 0; virtual int RunVertices(const u8* src, u8* dst, int count) = 0;
// per loader public state // per loader public state
PortableVertexDeclaration m_native_vtx_decl{}; PortableVertexDeclaration m_native_vtx_decl{};

View File

@ -332,7 +332,7 @@ static void CheckCPConfiguration(int vtx_attr_group)
} }
template <bool IsPreprocess> template <bool IsPreprocess>
int RunVertices(int vtx_attr_group, OpcodeDecoder::Primitive primitive, int count, DataReader src) int RunVertices(int vtx_attr_group, OpcodeDecoder::Primitive primitive, int count, const u8* src)
{ {
if (count == 0) [[unlikely]] if (count == 0) [[unlikely]]
return 0; return 0;
@ -341,8 +341,6 @@ int RunVertices(int vtx_attr_group, OpcodeDecoder::Primitive primitive, int coun
VertexLoaderBase* loader = RefreshLoader<IsPreprocess>(vtx_attr_group); VertexLoaderBase* loader = RefreshLoader<IsPreprocess>(vtx_attr_group);
int size = count * loader->m_vertex_size; int size = count * loader->m_vertex_size;
if ((int)src.size() < size) [[unlikely]]
return -1;
if constexpr (!IsPreprocess) if constexpr (!IsPreprocess)
{ {
@ -371,7 +369,7 @@ int RunVertices(int vtx_attr_group, OpcodeDecoder::Primitive primitive, int coun
DataReader dst = g_vertex_manager->PrepareForAdditionalData( DataReader dst = g_vertex_manager->PrepareForAdditionalData(
primitive, count, loader->m_native_vtx_decl.stride, cullall); primitive, count, loader->m_native_vtx_decl.stride, cullall);
count = loader->RunVertices(src, dst, count); count = loader->RunVertices(src, dst.GetPointer(), count);
g_vertex_manager->AddIndices(primitive, count); g_vertex_manager->AddIndices(primitive, count);
g_vertex_manager->FlushData(count, loader->m_native_vtx_decl.stride); g_vertex_manager->FlushData(count, loader->m_native_vtx_decl.stride);
@ -383,9 +381,9 @@ int RunVertices(int vtx_attr_group, OpcodeDecoder::Primitive primitive, int coun
} }
template int RunVertices<false>(int vtx_attr_group, OpcodeDecoder::Primitive primitive, int count, template int RunVertices<false>(int vtx_attr_group, OpcodeDecoder::Primitive primitive, int count,
DataReader src); const u8* src);
template int RunVertices<true>(int vtx_attr_group, OpcodeDecoder::Primitive primitive, int count, template int RunVertices<true>(int vtx_attr_group, OpcodeDecoder::Primitive primitive, int count,
DataReader src); const u8* src);
NativeVertexFormat* GetCurrentVertexFormat() NativeVertexFormat* GetCurrentVertexFormat()
{ {

View File

@ -12,7 +12,6 @@
#include "Common/EnumMap.h" #include "Common/EnumMap.h"
#include "VideoCommon/CPMemory.h" #include "VideoCommon/CPMemory.h"
class DataReader;
class NativeVertexFormat; class NativeVertexFormat;
struct PortableVertexDeclaration; struct PortableVertexDeclaration;
@ -43,7 +42,7 @@ NativeVertexFormat* GetUberVertexFormat(const PortableVertexDeclaration& decl);
// Returns -1 if buf_size is insufficient, else the amount of bytes consumed // Returns -1 if buf_size is insufficient, else the amount of bytes consumed
template <bool IsPreprocess = false> template <bool IsPreprocess = false>
int RunVertices(int vtx_attr_group, OpcodeDecoder::Primitive primitive, int count, DataReader src); int RunVertices(int vtx_attr_group, OpcodeDecoder::Primitive primitive, int count, const u8* src);
namespace detail namespace detail
{ {

View File

@ -7,8 +7,9 @@
#include "Common/CommonTypes.h" #include "Common/CommonTypes.h"
#include "Common/Inline.h" #include "Common/Inline.h"
#include "Common/Swap.h"
extern u8* g_video_buffer_read_ptr; extern const u8* g_video_buffer_read_ptr;
extern u8* g_vertex_manager_write_ptr; extern u8* g_vertex_manager_write_ptr;
DOLPHIN_FORCE_INLINE void DataSkip(u32 skip) DOLPHIN_FORCE_INLINE void DataSkip(u32 skip)
@ -24,7 +25,7 @@ DOLPHIN_FORCE_INLINE void DataSkip()
} }
template <typename T> template <typename T>
DOLPHIN_FORCE_INLINE T DataPeek(int _uOffset, u8* bufp = g_video_buffer_read_ptr) DOLPHIN_FORCE_INLINE T DataPeek(int _uOffset, const u8* bufp = g_video_buffer_read_ptr)
{ {
T result; T result;
std::memcpy(&result, &bufp[_uOffset], sizeof(T)); std::memcpy(&result, &bufp[_uOffset], sizeof(T));
@ -32,7 +33,7 @@ DOLPHIN_FORCE_INLINE T DataPeek(int _uOffset, u8* bufp = g_video_buffer_read_ptr
} }
template <typename T> template <typename T>
DOLPHIN_FORCE_INLINE T DataRead(u8** bufp = &g_video_buffer_read_ptr) DOLPHIN_FORCE_INLINE T DataRead(const u8** bufp = &g_video_buffer_read_ptr)
{ {
auto const result = DataPeek<T>(0, *bufp); auto const result = DataPeek<T>(0, *bufp);
*bufp += sizeof(T); *bufp += sizeof(T);
@ -47,7 +48,7 @@ DOLPHIN_FORCE_INLINE u32 DataReadU32Unswapped()
return result; return result;
} }
DOLPHIN_FORCE_INLINE u8* DataGetPosition() DOLPHIN_FORCE_INLINE const u8* DataGetPosition()
{ {
return g_video_buffer_read_ptr; return g_video_buffer_read_ptr;
} }

View File

@ -16,7 +16,6 @@
#include "Common/x64ABI.h" #include "Common/x64ABI.h"
#include "Common/x64Emitter.h" #include "Common/x64Emitter.h"
#include "VideoCommon/CPMemory.h" #include "VideoCommon/CPMemory.h"
#include "VideoCommon/DataReader.h"
#include "VideoCommon/VertexLoaderManager.h" #include "VideoCommon/VertexLoaderManager.h"
using namespace Gen; using namespace Gen;
@ -582,9 +581,9 @@ void VertexLoaderX64::GenerateVertexLoader()
m_native_vtx_decl.stride = m_dst_ofs; m_native_vtx_decl.stride = m_dst_ofs;
} }
int VertexLoaderX64::RunVertices(DataReader src, DataReader dst, int count) int VertexLoaderX64::RunVertices(const u8* src, u8* dst, int count)
{ {
m_numLoadedVertices += count; m_numLoadedVertices += count;
return ((int (*)(u8*, u8*, int, const void*))region)(src.GetPointer(), dst.GetPointer(), count, return ((int (*)(const u8* src, u8* dst, int count, const void* base))region)(src, dst, count,
memory_base_ptr); memory_base_ptr);
} }

View File

@ -18,7 +18,7 @@ public:
VertexLoaderX64(const TVtxDesc& vtx_desc, const VAT& vtx_att); VertexLoaderX64(const TVtxDesc& vtx_desc, const VAT& vtx_att);
protected: protected:
int RunVertices(DataReader src, DataReader dst, int count) override; int RunVertices(const u8* src, u8* dst, int count) override;
private: private:
u32 m_src_ofs = 0; u32 m_src_ofs = 0;

View File

@ -9,7 +9,6 @@
#include "Common/CommonTypes.h" #include "Common/CommonTypes.h"
#include "Common/EnumMap.h" #include "Common/EnumMap.h"
#include "VideoCommon/DataReader.h"
#include "VideoCommon/VertexLoader.h" #include "VideoCommon/VertexLoader.h"
#include "VideoCommon/VertexLoaderManager.h" #include "VideoCommon/VertexLoaderManager.h"
#include "VideoCommon/VertexLoaderUtils.h" #include "VideoCommon/VertexLoaderUtils.h"
@ -43,7 +42,6 @@ template <typename T, u32 N>
void ReadIndirect(VertexLoader* loader, const T* data) void ReadIndirect(VertexLoader* loader, const T* data)
{ {
static_assert(3 == N || 9 == N, "N is only sane as 3 or 9!"); static_assert(3 == N || 9 == N, "N is only sane as 3 or 9!");
DataReader dst(g_vertex_manager_write_ptr, nullptr);
for (u32 i = 0; i < N; ++i) for (u32 i = 0; i < N; ++i)
{ {
@ -55,10 +53,9 @@ void ReadIndirect(VertexLoader* loader, const T* data)
else if (i >= 6 && i < 9) else if (i >= 6 && i < 9)
VertexLoaderManager::binormal_cache[i - 6] = value; VertexLoaderManager::binormal_cache[i - 6] = value;
} }
dst.Write(value); DataWrite(value);
} }
g_vertex_manager_write_ptr = dst.GetPointer();
LOG_NORM(); LOG_NORM();
} }

View File

@ -10,7 +10,6 @@
#include "Common/EnumMap.h" #include "Common/EnumMap.h"
#include "Common/Swap.h" #include "Common/Swap.h"
#include "VideoCommon/DataReader.h"
#include "VideoCommon/VertexLoader.h" #include "VideoCommon/VertexLoader.h"
#include "VideoCommon/VertexLoaderManager.h" #include "VideoCommon/VertexLoaderManager.h"
#include "VideoCommon/VertexLoaderUtils.h" #include "VideoCommon/VertexLoaderUtils.h"
@ -35,19 +34,15 @@ void Pos_ReadDirect(VertexLoader* loader)
{ {
static_assert(N <= 3, "N > 3 is not sane!"); static_assert(N <= 3, "N > 3 is not sane!");
const auto scale = loader->m_posScale; const auto scale = loader->m_posScale;
DataReader dst(g_vertex_manager_write_ptr, nullptr);
DataReader src(g_video_buffer_read_ptr, nullptr);
for (int i = 0; i < N; ++i) for (int i = 0; i < N; ++i)
{ {
const float value = PosScale(src.Read<T>(), scale); const float value = PosScale(DataRead<T>(), scale);
if (loader->m_remaining < 3) if (loader->m_remaining < 3)
VertexLoaderManager::position_cache[loader->m_remaining][i] = value; VertexLoaderManager::position_cache[loader->m_remaining][i] = value;
dst.Write(value); DataWrite(value);
} }
g_vertex_manager_write_ptr = dst.GetPointer();
g_video_buffer_read_ptr = src.GetPointer();
LOG_VTX(); LOG_VTX();
} }
@ -63,17 +58,15 @@ void Pos_ReadIndex(VertexLoader* loader)
reinterpret_cast<const T*>(VertexLoaderManager::cached_arraybases[CPArray::Position] + reinterpret_cast<const T*>(VertexLoaderManager::cached_arraybases[CPArray::Position] +
(index * g_main_cp_state.array_strides[CPArray::Position])); (index * g_main_cp_state.array_strides[CPArray::Position]));
const auto scale = loader->m_posScale; const auto scale = loader->m_posScale;
DataReader dst(g_vertex_manager_write_ptr, nullptr);
for (int i = 0; i < N; ++i) for (int i = 0; i < N; ++i)
{ {
const float value = PosScale(Common::FromBigEndian(data[i]), scale); const float value = PosScale(Common::FromBigEndian(data[i]), scale);
if (loader->m_remaining < 3) if (loader->m_remaining < 3)
VertexLoaderManager::position_cache[loader->m_remaining][i] = value; VertexLoaderManager::position_cache[loader->m_remaining][i] = value;
dst.Write(value); DataWrite(value);
} }
g_vertex_manager_write_ptr = dst.GetPointer();
LOG_VTX(); LOG_VTX();
} }

View File

@ -8,7 +8,6 @@
#include "Common/CommonTypes.h" #include "Common/CommonTypes.h"
#include "Common/Swap.h" #include "Common/Swap.h"
#include "VideoCommon/DataReader.h"
#include "VideoCommon/VertexLoader.h" #include "VideoCommon/VertexLoader.h"
#include "VideoCommon/VertexLoaderManager.h" #include "VideoCommon/VertexLoaderManager.h"
#include "VideoCommon/VertexLoaderUtils.h" #include "VideoCommon/VertexLoaderUtils.h"
@ -36,14 +35,9 @@ template <typename T, int N>
void TexCoord_ReadDirect(VertexLoader* loader) void TexCoord_ReadDirect(VertexLoader* loader)
{ {
const auto scale = loader->m_tcScale[loader->m_tcIndex]; const auto scale = loader->m_tcScale[loader->m_tcIndex];
DataReader dst(g_vertex_manager_write_ptr, nullptr);
DataReader src(g_video_buffer_read_ptr, nullptr);
for (int i = 0; i != N; ++i) for (int i = 0; i != N; ++i)
dst.Write(TCScale(src.Read<T>(), scale)); DataWrite(TCScale(DataRead<T>(), scale));
g_vertex_manager_write_ptr = dst.GetPointer();
g_video_buffer_read_ptr = src.GetPointer();
++loader->m_tcIndex; ++loader->m_tcIndex;
} }
@ -58,12 +52,10 @@ void TexCoord_ReadIndex(VertexLoader* loader)
VertexLoaderManager::cached_arraybases[CPArray::TexCoord0 + loader->m_tcIndex] + VertexLoaderManager::cached_arraybases[CPArray::TexCoord0 + loader->m_tcIndex] +
(index * g_main_cp_state.array_strides[CPArray::TexCoord0 + loader->m_tcIndex])); (index * g_main_cp_state.array_strides[CPArray::TexCoord0 + loader->m_tcIndex]));
const auto scale = loader->m_tcScale[loader->m_tcIndex]; const auto scale = loader->m_tcScale[loader->m_tcIndex];
DataReader dst(g_vertex_manager_write_ptr, nullptr);
for (int i = 0; i != N; ++i) for (int i = 0; i != N; ++i)
dst.Write(TCScale(Common::FromBigEndian(data[i]), scale)); DataWrite(TCScale(Common::FromBigEndian(data[i]), scale));
g_vertex_manager_write_ptr = dst.GetPointer();
++loader->m_tcIndex; ++loader->m_tcIndex;
} }

View File

@ -91,7 +91,7 @@ protected:
if (expected_count == -1) if (expected_count == -1)
expected_count = count; expected_count = count;
ResetPointers(); ResetPointers();
int actual_count = m_loader->RunVertices(m_src, m_dst, count); int actual_count = m_loader->RunVertices(m_src.GetPointer(), m_dst.GetPointer(), count);
EXPECT_EQ(actual_count, expected_count); EXPECT_EQ(actual_count, expected_count);
} }