Merge branch 'master' into windows-unicode
This commit is contained in:
commit
2b1af36900
|
@ -29,6 +29,7 @@
|
||||||
|
|
||||||
#include <map>
|
#include <map>
|
||||||
#include <vector>
|
#include <vector>
|
||||||
|
#include <list>
|
||||||
#include <deque>
|
#include <deque>
|
||||||
#include <string>
|
#include <string>
|
||||||
|
|
||||||
|
@ -45,7 +46,8 @@ struct LinkedListItem : public T
|
||||||
class PointerWrap
|
class PointerWrap
|
||||||
{
|
{
|
||||||
public:
|
public:
|
||||||
enum Mode {
|
enum Mode
|
||||||
|
{
|
||||||
MODE_READ = 1, // load
|
MODE_READ = 1, // load
|
||||||
MODE_WRITE, // save
|
MODE_WRITE, // save
|
||||||
MODE_MEASURE, // calculate size
|
MODE_MEASURE, // calculate size
|
||||||
|
@ -57,124 +59,95 @@ public:
|
||||||
|
|
||||||
public:
|
public:
|
||||||
PointerWrap(u8 **ptr_, Mode mode_) : ptr(ptr_), mode(mode_) {}
|
PointerWrap(u8 **ptr_, Mode mode_) : ptr(ptr_), mode(mode_) {}
|
||||||
PointerWrap(unsigned char **ptr_, int mode_) : ptr((u8**)ptr_), mode((Mode)mode_) {}
|
|
||||||
|
|
||||||
void SetMode(Mode mode_) {mode = mode_;}
|
void SetMode(Mode mode_) { mode = mode_; }
|
||||||
Mode GetMode() const {return mode;}
|
Mode GetMode() const { return mode; }
|
||||||
u8 **GetPPtr() {return ptr;}
|
u8** GetPPtr() { return ptr; }
|
||||||
|
|
||||||
void DoVoid(void *data, int size)
|
template <typename K, class V>
|
||||||
|
void Do(std::map<K, V>& x)
|
||||||
{
|
{
|
||||||
switch (mode) {
|
u32 count = (u32)x.size();
|
||||||
case MODE_READ: memcpy(data, *ptr, size); break;
|
Do(count);
|
||||||
case MODE_WRITE: memcpy(*ptr, data, size); break;
|
|
||||||
case MODE_MEASURE: break; // MODE_MEASURE - don't need to do anything
|
switch (mode)
|
||||||
case MODE_VERIFY: for(int i = 0; i < size; i++) _dbg_assert_msg_(COMMON, ((u8*)data)[i] == (*ptr)[i], "Savestate verification failure: %d (0x%X) (at %p) != %d (0x%X) (at %p).\n", ((u8*)data)[i], ((u8*)data)[i], &((u8*)data)[i], (*ptr)[i], (*ptr)[i], &(*ptr)[i]); break;
|
{
|
||||||
default: break; // throw an error?
|
|
||||||
}
|
|
||||||
(*ptr) += size;
|
|
||||||
}
|
|
||||||
|
|
||||||
template<class T>
|
|
||||||
void Do(std::map<unsigned int, T> &x)
|
|
||||||
{
|
|
||||||
unsigned int number = (unsigned int)x.size();
|
|
||||||
Do(number);
|
|
||||||
switch (mode) {
|
|
||||||
case MODE_READ:
|
case MODE_READ:
|
||||||
|
for (x.clear(); count != 0; --count)
|
||||||
{
|
{
|
||||||
x.clear();
|
std::pair<K, V> pair;
|
||||||
while (number > 0)
|
Do(pair.first);
|
||||||
{
|
Do(pair.second);
|
||||||
unsigned int first = 0;
|
x.insert(pair);
|
||||||
Do(first);
|
|
||||||
T second;
|
|
||||||
Do(second);
|
|
||||||
x[first] = second;
|
|
||||||
--number;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
|
|
||||||
case MODE_WRITE:
|
case MODE_WRITE:
|
||||||
case MODE_MEASURE:
|
case MODE_MEASURE:
|
||||||
case MODE_VERIFY:
|
case MODE_VERIFY:
|
||||||
|
for (auto itr = x.begin(); itr != x.end(); ++itr)
|
||||||
{
|
{
|
||||||
typename std::map<unsigned int, T>::iterator itr = x.begin();
|
Do(itr->first);
|
||||||
while (number > 0)
|
Do(itr->second);
|
||||||
{
|
|
||||||
Do(itr->first);
|
|
||||||
Do(itr->second);
|
|
||||||
--number;
|
|
||||||
++itr;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// Store vectors.
|
|
||||||
template<class T>
|
|
||||||
void Do(std::vector<T> &x)
|
|
||||||
{
|
|
||||||
u32 vec_size = (u32)x.size();
|
|
||||||
Do(vec_size);
|
|
||||||
x.resize(vec_size);
|
|
||||||
DoArray(&x[0], vec_size);
|
|
||||||
}
|
|
||||||
|
|
||||||
// Store deques.
|
template <typename T>
|
||||||
template<class T>
|
void DoContainer(T& x)
|
||||||
void Do(std::deque<T> &x)
|
|
||||||
{
|
{
|
||||||
u32 deq_size = (u32)x.size();
|
u32 size = (u32)x.size();
|
||||||
Do(deq_size);
|
Do(size);
|
||||||
x.resize(deq_size);
|
x.resize(size);
|
||||||
u32 i;
|
|
||||||
for(i = 0; i < deq_size; i++)
|
|
||||||
DoVoid(&x[i],sizeof(T));
|
|
||||||
}
|
|
||||||
|
|
||||||
// Store strings.
|
|
||||||
void Do(std::string &x)
|
|
||||||
{
|
|
||||||
int stringLen = (int)x.length() + 1;
|
|
||||||
Do(stringLen);
|
|
||||||
|
|
||||||
switch (mode) {
|
for (auto itr = x.begin(); itr != x.end(); ++itr)
|
||||||
case MODE_READ: x = (char*)*ptr; break;
|
Do(*itr);
|
||||||
case MODE_WRITE: memcpy(*ptr, x.c_str(), stringLen); break;
|
|
||||||
case MODE_MEASURE: break;
|
|
||||||
case MODE_VERIFY: _dbg_assert_msg_(COMMON, !strcmp(x.c_str(), (char*)*ptr), "Savestate verification failure: \"%s\" != \"%s\" (at %p).\n", x.c_str(), (char*)*ptr, ptr); break;
|
|
||||||
}
|
|
||||||
(*ptr) += stringLen;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void Do(std::wstring &x)
|
template <typename T>
|
||||||
|
void Do(std::vector<T>& x)
|
||||||
{
|
{
|
||||||
int stringLen = sizeof(wchar_t)*((int)x.length() + 1);
|
DoContainer(x);
|
||||||
Do(stringLen);
|
}
|
||||||
|
|
||||||
switch (mode) {
|
template <typename T>
|
||||||
case MODE_READ: x.assign((wchar_t*)*ptr, (stringLen / sizeof(wchar_t)) - 1); break;
|
void Do(std::list<T>& x)
|
||||||
case MODE_WRITE: memcpy(*ptr, x.c_str(), stringLen); break;
|
{
|
||||||
case MODE_MEASURE: break;
|
DoContainer(x);
|
||||||
case MODE_VERIFY: _dbg_assert_msg_(COMMON, x == (wchar_t*)*ptr, "Savestate verification failure: \"%ls\" != \"%ls\" (at %p).\n", x.c_str(), (wchar_t*)*ptr, ptr); break;
|
}
|
||||||
}
|
|
||||||
(*ptr) += stringLen;
|
template <typename T>
|
||||||
|
void Do(std::deque<T>& x)
|
||||||
|
{
|
||||||
|
DoContainer(x);
|
||||||
|
}
|
||||||
|
|
||||||
|
template <typename T>
|
||||||
|
void Do(std::basic_string<T>& x)
|
||||||
|
{
|
||||||
|
DoContainer(x);
|
||||||
}
|
}
|
||||||
|
|
||||||
template<class T>
|
template <typename T>
|
||||||
void DoArray(T *x, int count) {
|
void DoArray(T* x, u32 count)
|
||||||
DoVoid((void *)x, sizeof(T) * count);
|
{
|
||||||
|
for (u32 i = 0; i != count; ++i)
|
||||||
|
Do(x[i]);
|
||||||
}
|
}
|
||||||
|
|
||||||
template<class T>
|
template <typename T>
|
||||||
void Do(T &x) {
|
void Do(T& x)
|
||||||
DoVoid((void *)&x, sizeof(x));
|
{
|
||||||
|
// TODO: Bad, Do(some_non_POD) will compile and fail at runtime
|
||||||
|
// type_traits are not fully supported everywhere yet
|
||||||
|
|
||||||
|
DoVoid((void*)&x, sizeof(x));
|
||||||
}
|
}
|
||||||
|
|
||||||
template<class T>
|
template <typename T>
|
||||||
void DoPointer(T* &x, T*const base) {
|
void DoPointer(T*& x, T* const base)
|
||||||
|
{
|
||||||
// pointers can be more than 2^31 apart, but you're using this function wrong if you need that much range
|
// pointers can be more than 2^31 apart, but you're using this function wrong if you need that much range
|
||||||
s32 offset = x - base;
|
s32 offset = x - base;
|
||||||
Do(offset);
|
Do(offset);
|
||||||
|
@ -182,7 +155,8 @@ public:
|
||||||
x = base + offset;
|
x = base + offset;
|
||||||
}
|
}
|
||||||
|
|
||||||
template<class T, LinkedListItem<T>* (*TNew)(), void (*TFree)(LinkedListItem<T>*), void (*TDo)(PointerWrap&, T*)>
|
// Let's pretend std::list doesn't exist!
|
||||||
|
template <class T, LinkedListItem<T>* (*TNew)(), void (*TFree)(LinkedListItem<T>*), void (*TDo)(PointerWrap&, T*)>
|
||||||
void DoLinkedList(LinkedListItem<T>*& list_start, LinkedListItem<T>** list_end=0)
|
void DoLinkedList(LinkedListItem<T>*& list_start, LinkedListItem<T>** list_end=0)
|
||||||
{
|
{
|
||||||
LinkedListItem<T>* list_cur = list_start;
|
LinkedListItem<T>* list_cur = list_start;
|
||||||
|
@ -242,25 +216,61 @@ public:
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void DoMarker(const char* prevName, u32 arbitraryNumber=0x42)
|
void DoMarker(const char* prevName, u32 arbitraryNumber = 0x42)
|
||||||
{
|
{
|
||||||
u32 cookie = arbitraryNumber;
|
u32 cookie = arbitraryNumber;
|
||||||
Do(cookie);
|
Do(cookie);
|
||||||
if(mode == PointerWrap::MODE_READ && cookie != arbitraryNumber)
|
|
||||||
|
if (mode == PointerWrap::MODE_READ && cookie != arbitraryNumber)
|
||||||
{
|
{
|
||||||
PanicAlertT("Error: After \"%s\", found %d (0x%X) instead of save marker %d (0x%X). Aborting savestate load...", prevName, cookie, cookie, arbitraryNumber, arbitraryNumber);
|
PanicAlertT("Error: After \"%s\", found %d (0x%X) instead of save marker %d (0x%X). Aborting savestate load...",
|
||||||
|
prevName, cookie, cookie, arbitraryNumber, arbitraryNumber);
|
||||||
mode = PointerWrap::MODE_MEASURE;
|
mode = PointerWrap::MODE_MEASURE;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
private:
|
||||||
|
__forceinline void DoByte(u8& x)
|
||||||
|
{
|
||||||
|
switch (mode)
|
||||||
|
{
|
||||||
|
case MODE_READ:
|
||||||
|
x = **ptr;
|
||||||
|
break;
|
||||||
|
|
||||||
|
case MODE_WRITE:
|
||||||
|
**ptr = x;
|
||||||
|
break;
|
||||||
|
|
||||||
|
case MODE_MEASURE:
|
||||||
|
break;
|
||||||
|
|
||||||
|
case MODE_VERIFY:
|
||||||
|
_dbg_assert_msg_(COMMON, (x == *ptr),
|
||||||
|
"Savestate verification failure: %d (0x%X) (at %p) != %d (0x%X) (at %p).\n",
|
||||||
|
x, x, &x, *ptr, *ptr, &*ptr);
|
||||||
|
break;
|
||||||
|
|
||||||
|
default:
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
|
||||||
|
++(*ptr);
|
||||||
|
}
|
||||||
|
|
||||||
|
void DoVoid(void *data, u32 size)
|
||||||
|
{
|
||||||
|
for(u32 i = 0; i != size; ++i)
|
||||||
|
DoByte(reinterpret_cast<u8*>(data)[i]);
|
||||||
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
||||||
class CChunkFileReader
|
class CChunkFileReader
|
||||||
{
|
{
|
||||||
public:
|
public:
|
||||||
// Load file template
|
// Load file template
|
||||||
template<class T>
|
template<class T>
|
||||||
static bool Load(const std::string& _rFilename, int _Revision, T& _class)
|
static bool Load(const std::string& _rFilename, u32 _Revision, T& _class)
|
||||||
{
|
{
|
||||||
INFO_LOG(COMMON, "ChunkReader: Loading %s" , _rFilename.c_str());
|
INFO_LOG(COMMON, "ChunkReader: Loading %s" , _rFilename.c_str());
|
||||||
|
|
||||||
|
@ -300,7 +310,7 @@ public:
|
||||||
}
|
}
|
||||||
|
|
||||||
// get size
|
// get size
|
||||||
const int sz = (int)(fileSize - headerSize);
|
const u32 sz = (u32)(fileSize - headerSize);
|
||||||
if (header.ExpectedSize != sz)
|
if (header.ExpectedSize != sz)
|
||||||
{
|
{
|
||||||
ERROR_LOG(COMMON,"ChunkReader: Bad file size, got %d expected %d",
|
ERROR_LOG(COMMON,"ChunkReader: Bad file size, got %d expected %d",
|
||||||
|
@ -309,17 +319,16 @@ public:
|
||||||
}
|
}
|
||||||
|
|
||||||
// read the state
|
// read the state
|
||||||
u8* buffer = new u8[sz];
|
std::vector<u8> buffer(sz);
|
||||||
if (!pFile.ReadBytes(buffer, sz))
|
if (!pFile.ReadArray(&buffer[0], sz))
|
||||||
{
|
{
|
||||||
ERROR_LOG(COMMON,"ChunkReader: Error reading file");
|
ERROR_LOG(COMMON,"ChunkReader: Error reading file");
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
u8 *ptr = buffer;
|
u8* ptr = &buffer[0];
|
||||||
PointerWrap p(&ptr, PointerWrap::MODE_READ);
|
PointerWrap p(&ptr, PointerWrap::MODE_READ);
|
||||||
_class.DoState(p);
|
_class.DoState(p);
|
||||||
delete[] buffer;
|
|
||||||
|
|
||||||
INFO_LOG(COMMON, "ChunkReader: Done loading %s" , _rFilename.c_str());
|
INFO_LOG(COMMON, "ChunkReader: Done loading %s" , _rFilename.c_str());
|
||||||
return true;
|
return true;
|
||||||
|
@ -327,7 +336,7 @@ public:
|
||||||
|
|
||||||
// Save file template
|
// Save file template
|
||||||
template<class T>
|
template<class T>
|
||||||
static bool Save(const std::string& _rFilename, int _Revision, T& _class)
|
static bool Save(const std::string& _rFilename, u32 _Revision, T& _class)
|
||||||
{
|
{
|
||||||
INFO_LOG(COMMON, "ChunkReader: Writing %s" , _rFilename.c_str());
|
INFO_LOG(COMMON, "ChunkReader: Writing %s" , _rFilename.c_str());
|
||||||
File::IOFile pFile(_rFilename, "wb");
|
File::IOFile pFile(_rFilename, "wb");
|
||||||
|
@ -349,9 +358,8 @@ public:
|
||||||
|
|
||||||
// Create header
|
// Create header
|
||||||
SChunkHeader header;
|
SChunkHeader header;
|
||||||
header.Compress = 0;
|
|
||||||
header.Revision = _Revision;
|
header.Revision = _Revision;
|
||||||
header.ExpectedSize = (int)sz;
|
header.ExpectedSize = (u32)sz;
|
||||||
|
|
||||||
// Write to file
|
// Write to file
|
||||||
if (!pFile.WriteArray(&header, 1))
|
if (!pFile.WriteArray(&header, 1))
|
||||||
|
@ -360,23 +368,21 @@ public:
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (!pFile.WriteBytes(&buffer[0], sz))
|
if (!pFile.WriteArray(&buffer[0], sz))
|
||||||
{
|
{
|
||||||
ERROR_LOG(COMMON,"ChunkReader: Failed writing data");
|
ERROR_LOG(COMMON,"ChunkReader: Failed writing data");
|
||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
INFO_LOG(COMMON,"ChunkReader: Done writing %s",
|
INFO_LOG(COMMON,"ChunkReader: Done writing %s", _rFilename.c_str());
|
||||||
_rFilename.c_str());
|
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
||||||
private:
|
private:
|
||||||
struct SChunkHeader
|
struct SChunkHeader
|
||||||
{
|
{
|
||||||
int Revision;
|
u32 Revision;
|
||||||
int Compress;
|
u32 ExpectedSize;
|
||||||
int ExpectedSize;
|
|
||||||
};
|
};
|
||||||
};
|
};
|
||||||
|
|
||||||
|
|
|
@ -249,7 +249,7 @@ std::string ReplaceAll(std::string result, const std::string& src, const std::st
|
||||||
while(1)
|
while(1)
|
||||||
{
|
{
|
||||||
const int pos = result.find(src);
|
const int pos = result.find(src);
|
||||||
if (pos == 16) break;
|
if (pos == -1) break;
|
||||||
result.replace(pos, src.size(), dest);
|
result.replace(pos, src.size(), dest);
|
||||||
}
|
}
|
||||||
return result;
|
return result;
|
||||||
|
|
|
@ -22,6 +22,7 @@
|
||||||
#include <vector>
|
#include <vector>
|
||||||
|
|
||||||
#include "ChunkFile.h"
|
#include "ChunkFile.h"
|
||||||
|
#include "../../VideoCommon/Src/PerfQueryBase.h"
|
||||||
|
|
||||||
typedef void (*writeFn16)(const u16,const u32);
|
typedef void (*writeFn16)(const u16,const u32);
|
||||||
typedef void (*writeFn32)(const u32,const u32);
|
typedef void (*writeFn32)(const u32,const u32);
|
||||||
|
@ -107,6 +108,7 @@ public:
|
||||||
virtual void Video_EndField() = 0;
|
virtual void Video_EndField() = 0;
|
||||||
|
|
||||||
virtual u32 Video_AccessEFB(EFBAccessType, u32, u32, u32) = 0;
|
virtual u32 Video_AccessEFB(EFBAccessType, u32, u32, u32) = 0;
|
||||||
|
virtual u32 Video_GetQueryResult(PerfQueryType type) = 0;
|
||||||
|
|
||||||
virtual void Video_AddMessage(const char* pstr, unsigned int milliseconds) = 0;
|
virtual void Video_AddMessage(const char* pstr, unsigned int milliseconds) = 0;
|
||||||
virtual void Video_ClearMessages() = 0;
|
virtual void Video_ClearMessages() = 0;
|
||||||
|
@ -156,8 +158,10 @@ class VideoBackendHardware : public VideoBackend
|
||||||
void Video_ExitLoop();
|
void Video_ExitLoop();
|
||||||
void Video_BeginField(u32, FieldType, u32, u32);
|
void Video_BeginField(u32, FieldType, u32, u32);
|
||||||
void Video_EndField();
|
void Video_EndField();
|
||||||
u32 Video_AccessEFB(EFBAccessType, u32, u32, u32);
|
|
||||||
|
|
||||||
|
u32 Video_AccessEFB(EFBAccessType, u32, u32, u32);
|
||||||
|
u32 Video_GetQueryResult(PerfQueryType type);
|
||||||
|
|
||||||
void Video_AddMessage(const char* pstr, unsigned int milliseconds);
|
void Video_AddMessage(const char* pstr, unsigned int milliseconds);
|
||||||
void Video_ClearMessages();
|
void Video_ClearMessages();
|
||||||
bool Video_Screenshot(const char* filename);
|
bool Video_Screenshot(const char* filename);
|
||||||
|
|
|
@ -362,7 +362,11 @@ void SConfig::LoadSettings()
|
||||||
|
|
||||||
// Core
|
// Core
|
||||||
ini.Get("Core", "HLE_BS2", &m_LocalCoreStartupParameter.bHLE_BS2, false);
|
ini.Get("Core", "HLE_BS2", &m_LocalCoreStartupParameter.bHLE_BS2, false);
|
||||||
|
#ifdef _M_ARM
|
||||||
|
ini.Get("Core", "CPUCore", &m_LocalCoreStartupParameter.iCPUCore, 3);
|
||||||
|
#else
|
||||||
ini.Get("Core", "CPUCore", &m_LocalCoreStartupParameter.iCPUCore, 1);
|
ini.Get("Core", "CPUCore", &m_LocalCoreStartupParameter.iCPUCore, 1);
|
||||||
|
#endif
|
||||||
ini.Get("Core", "DSPThread", &m_LocalCoreStartupParameter.bDSPThread, false);
|
ini.Get("Core", "DSPThread", &m_LocalCoreStartupParameter.bDSPThread, false);
|
||||||
ini.Get("Core", "DSPHLE", &m_LocalCoreStartupParameter.bDSPHLE, true);
|
ini.Get("Core", "DSPHLE", &m_LocalCoreStartupParameter.bDSPHLE, true);
|
||||||
ini.Get("Core", "CPUThread", &m_LocalCoreStartupParameter.bCPUThread, true);
|
ini.Get("Core", "CPUThread", &m_LocalCoreStartupParameter.bCPUThread, true);
|
||||||
|
|
|
@ -133,7 +133,7 @@ unsigned int GetAttached()
|
||||||
// input/output: ptr
|
// input/output: ptr
|
||||||
// input: mode
|
// input: mode
|
||||||
//
|
//
|
||||||
void DoState(unsigned char **ptr, int mode)
|
void DoState(u8 **ptr, PointerWrap::Mode mode)
|
||||||
{
|
{
|
||||||
// TODO:
|
// TODO:
|
||||||
|
|
||||||
|
|
|
@ -3,6 +3,7 @@
|
||||||
#define _WIIMOTE_H_
|
#define _WIIMOTE_H_
|
||||||
|
|
||||||
#include "../../InputCommon/Src/InputConfig.h"
|
#include "../../InputCommon/Src/InputConfig.h"
|
||||||
|
#include "ChunkFile.h"
|
||||||
|
|
||||||
#define MAX_WIIMOTES 4
|
#define MAX_WIIMOTES 4
|
||||||
|
|
||||||
|
@ -25,7 +26,7 @@ void Shutdown();
|
||||||
void Initialize(void* const hwnd);
|
void Initialize(void* const hwnd);
|
||||||
|
|
||||||
unsigned int GetAttached();
|
unsigned int GetAttached();
|
||||||
void DoState(unsigned char **ptr, int mode);
|
void DoState(u8 **ptr, PointerWrap::Mode mode);
|
||||||
void EmuStateChange(EMUSTATE_CHANGE newState);
|
void EmuStateChange(EMUSTATE_CHANGE newState);
|
||||||
InputPlugin *GetPlugin();
|
InputPlugin *GetPlugin();
|
||||||
|
|
||||||
|
|
|
@ -58,6 +58,7 @@ typedef DWORD (__stdcall *PBth_BluetoothGetRadioInfo)(HANDLE, PBLUETOOTH_RADIO_I
|
||||||
typedef DWORD (__stdcall *PBth_BluetoothRemoveDevice)(const BLUETOOTH_ADDRESS*);
|
typedef DWORD (__stdcall *PBth_BluetoothRemoveDevice)(const BLUETOOTH_ADDRESS*);
|
||||||
typedef DWORD (__stdcall *PBth_BluetoothSetServiceState)(HANDLE, const BLUETOOTH_DEVICE_INFO*, const GUID*, DWORD);
|
typedef DWORD (__stdcall *PBth_BluetoothSetServiceState)(HANDLE, const BLUETOOTH_DEVICE_INFO*, const GUID*, DWORD);
|
||||||
typedef DWORD (__stdcall *PBth_BluetoothAuthenticateDevice)(HWND, HANDLE, BLUETOOTH_DEVICE_INFO*, PWCHAR, ULONG);
|
typedef DWORD (__stdcall *PBth_BluetoothAuthenticateDevice)(HWND, HANDLE, BLUETOOTH_DEVICE_INFO*, PWCHAR, ULONG);
|
||||||
|
typedef DWORD (__stdcall *PBth_BluetoothEnumerateInstalledServices)(HANDLE, BLUETOOTH_DEVICE_INFO*, DWORD*, GUID*);
|
||||||
|
|
||||||
PHidD_GetHidGuid HidD_GetHidGuid = NULL;
|
PHidD_GetHidGuid HidD_GetHidGuid = NULL;
|
||||||
PHidD_GetAttributes HidD_GetAttributes = NULL;
|
PHidD_GetAttributes HidD_GetAttributes = NULL;
|
||||||
|
@ -73,6 +74,7 @@ PBth_BluetoothGetRadioInfo Bth_BluetoothGetRadioInfo = NULL;
|
||||||
PBth_BluetoothRemoveDevice Bth_BluetoothRemoveDevice = NULL;
|
PBth_BluetoothRemoveDevice Bth_BluetoothRemoveDevice = NULL;
|
||||||
PBth_BluetoothSetServiceState Bth_BluetoothSetServiceState = NULL;
|
PBth_BluetoothSetServiceState Bth_BluetoothSetServiceState = NULL;
|
||||||
PBth_BluetoothAuthenticateDevice Bth_BluetoothAuthenticateDevice = NULL;
|
PBth_BluetoothAuthenticateDevice Bth_BluetoothAuthenticateDevice = NULL;
|
||||||
|
PBth_BluetoothEnumerateInstalledServices Bth_BluetoothEnumerateInstalledServices = NULL;
|
||||||
|
|
||||||
HINSTANCE hid_lib = NULL;
|
HINSTANCE hid_lib = NULL;
|
||||||
HINSTANCE bthprops_lib = NULL;
|
HINSTANCE bthprops_lib = NULL;
|
||||||
|
@ -118,12 +120,14 @@ inline void init_lib()
|
||||||
Bth_BluetoothRemoveDevice = (PBth_BluetoothRemoveDevice)GetProcAddress(bthprops_lib, "BluetoothRemoveDevice");
|
Bth_BluetoothRemoveDevice = (PBth_BluetoothRemoveDevice)GetProcAddress(bthprops_lib, "BluetoothRemoveDevice");
|
||||||
Bth_BluetoothSetServiceState = (PBth_BluetoothSetServiceState)GetProcAddress(bthprops_lib, "BluetoothSetServiceState");
|
Bth_BluetoothSetServiceState = (PBth_BluetoothSetServiceState)GetProcAddress(bthprops_lib, "BluetoothSetServiceState");
|
||||||
Bth_BluetoothAuthenticateDevice = (PBth_BluetoothAuthenticateDevice)GetProcAddress(bthprops_lib, "BluetoothAuthenticateDevice");
|
Bth_BluetoothAuthenticateDevice = (PBth_BluetoothAuthenticateDevice)GetProcAddress(bthprops_lib, "BluetoothAuthenticateDevice");
|
||||||
|
Bth_BluetoothEnumerateInstalledServices = (PBth_BluetoothEnumerateInstalledServices)GetProcAddress(bthprops_lib, "BluetoothEnumerateInstalledServices");
|
||||||
|
|
||||||
if (!Bth_BluetoothFindDeviceClose || !Bth_BluetoothFindFirstDevice ||
|
if (!Bth_BluetoothFindDeviceClose || !Bth_BluetoothFindFirstDevice ||
|
||||||
!Bth_BluetoothFindFirstRadio || !Bth_BluetoothFindNextDevice ||
|
!Bth_BluetoothFindFirstRadio || !Bth_BluetoothFindNextDevice ||
|
||||||
!Bth_BluetoothFindNextRadio || !Bth_BluetoothFindRadioClose ||
|
!Bth_BluetoothFindNextRadio || !Bth_BluetoothFindRadioClose ||
|
||||||
!Bth_BluetoothGetRadioInfo || !Bth_BluetoothRemoveDevice ||
|
!Bth_BluetoothGetRadioInfo || !Bth_BluetoothRemoveDevice ||
|
||||||
!Bth_BluetoothSetServiceState || !Bth_BluetoothAuthenticateDevice)
|
!Bth_BluetoothSetServiceState || !Bth_BluetoothAuthenticateDevice ||
|
||||||
|
!Bth_BluetoothEnumerateInstalledServices)
|
||||||
{
|
{
|
||||||
PanicAlertT("Failed to load bthprops.cpl");
|
PanicAlertT("Failed to load bthprops.cpl");
|
||||||
exit(EXIT_FAILURE);
|
exit(EXIT_FAILURE);
|
||||||
|
@ -556,6 +560,14 @@ bool AttachWiimote(HANDLE hRadio, const BLUETOOTH_RADIO_INFO& radio_info, BLUETO
|
||||||
|
|
||||||
if (ERROR_SUCCESS != auth_result)
|
if (ERROR_SUCCESS != auth_result)
|
||||||
ERROR_LOG(WIIMOTE, "AttachWiimote: BluetoothAuthenticateDevice returned %08x", auth_result);
|
ERROR_LOG(WIIMOTE, "AttachWiimote: BluetoothAuthenticateDevice returned %08x", auth_result);
|
||||||
|
|
||||||
|
DWORD pcServices = 16;
|
||||||
|
GUID guids[16];
|
||||||
|
// If this is not done, the Wii device will not remember the pairing
|
||||||
|
const DWORD srv_result = Bth_BluetoothEnumerateInstalledServices(hRadio, &btdi, &pcServices, guids);
|
||||||
|
|
||||||
|
if (ERROR_SUCCESS != srv_result)
|
||||||
|
ERROR_LOG(WIIMOTE, "AttachWiimote: BluetoothEnumerateInstalledServices returned %08x", srv_result);
|
||||||
#endif
|
#endif
|
||||||
// Activate service
|
// Activate service
|
||||||
const DWORD hr = Bth_BluetoothSetServiceState(hRadio, &btdi,
|
const DWORD hr = Bth_BluetoothSetServiceState(hRadio, &btdi,
|
||||||
|
|
|
@ -71,7 +71,7 @@ static Common::Event g_compressAndDumpStateSyncEvent;
|
||||||
static std::thread g_save_thread;
|
static std::thread g_save_thread;
|
||||||
|
|
||||||
// Don't forget to increase this after doing changes on the savestate system
|
// Don't forget to increase this after doing changes on the savestate system
|
||||||
static const u32 STATE_VERSION = 14;
|
static const u32 STATE_VERSION = 16;
|
||||||
|
|
||||||
struct StateHeader
|
struct StateHeader
|
||||||
{
|
{
|
||||||
|
|
|
@ -49,7 +49,8 @@ WiiWAD::WiiWAD(const std::string& _rName)
|
||||||
if (pReader == NULL || File::IsDirectory(_rName))
|
if (pReader == NULL || File::IsDirectory(_rName))
|
||||||
{
|
{
|
||||||
m_Valid = false;
|
m_Valid = false;
|
||||||
return;
|
if(pReader) delete pReader;
|
||||||
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
m_Valid = ParseWAD(*pReader);
|
m_Valid = ParseWAD(*pReader);
|
||||||
|
|
|
@ -247,7 +247,7 @@ wxTextCtrl* CLogWindow::CreateTextCtrl(wxPanel* parent, wxWindowID id, long Styl
|
||||||
#else
|
#else
|
||||||
TC->SetBackgroundColour(*wxBLACK);
|
TC->SetBackgroundColour(*wxBLACK);
|
||||||
#endif
|
#endif
|
||||||
if (m_FontChoice && m_FontChoice->GetSelection() < (int)LogFont.size())
|
if (m_FontChoice && m_FontChoice->GetSelection() < (int)LogFont.size() && m_FontChoice->GetSelection() >= 0)
|
||||||
TC->SetDefaultStyle(wxTextAttr(wxNullColour, wxNullColour, LogFont[m_FontChoice->GetSelection()]));
|
TC->SetDefaultStyle(wxTextAttr(wxNullColour, wxNullColour, LogFont[m_FontChoice->GetSelection()]));
|
||||||
|
|
||||||
return TC;
|
return TC;
|
||||||
|
|
|
@ -69,6 +69,7 @@ bool Keyboard::UpdateInput()
|
||||||
CGRectMakeWithDictionaryRepresentation(boundsDictionary, &bounds);
|
CGRectMakeWithDictionaryRepresentation(boundsDictionary, &bounds);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
CFRelease(windowDescriptions);
|
||||||
CFRelease(windowArray);
|
CFRelease(windowArray);
|
||||||
|
|
||||||
CGEventRef event = CGEventCreate(nil);
|
CGEventRef event = CGEventCreate(nil);
|
||||||
|
|
|
@ -16,6 +16,7 @@ set(SRCS Src/BPFunctions.cpp
|
||||||
Src/OpcodeDecoding.cpp
|
Src/OpcodeDecoding.cpp
|
||||||
Src/OpenCL.cpp
|
Src/OpenCL.cpp
|
||||||
Src/OpenCL/OCLTextureDecoder.cpp
|
Src/OpenCL/OCLTextureDecoder.cpp
|
||||||
|
Src/PerfQueryBase.cpp
|
||||||
Src/PixelEngine.cpp
|
Src/PixelEngine.cpp
|
||||||
Src/PixelShaderGen.cpp
|
Src/PixelShaderGen.cpp
|
||||||
Src/PixelShaderManager.cpp
|
Src/PixelShaderManager.cpp
|
||||||
|
|
|
@ -62,7 +62,7 @@
|
||||||
#define BPMEM_COPYFILTER1 0x54
|
#define BPMEM_COPYFILTER1 0x54
|
||||||
#define BPMEM_CLEARBBOX1 0x55
|
#define BPMEM_CLEARBBOX1 0x55
|
||||||
#define BPMEM_CLEARBBOX2 0x56
|
#define BPMEM_CLEARBBOX2 0x56
|
||||||
#define BPMEM_UNKNOWN_57 0x57
|
#define BPMEM_CLEAR_PIXEL_PERF 0x57
|
||||||
#define BPMEM_REVBITS 0x58
|
#define BPMEM_REVBITS 0x58
|
||||||
#define BPMEM_SCISSOROFFSET 0x59
|
#define BPMEM_SCISSOROFFSET 0x59
|
||||||
#define BPMEM_PRELOAD_ADDR 0x60
|
#define BPMEM_PRELOAD_ADDR 0x60
|
||||||
|
|
|
@ -31,6 +31,7 @@
|
||||||
#include "VertexShaderManager.h"
|
#include "VertexShaderManager.h"
|
||||||
#include "Thread.h"
|
#include "Thread.h"
|
||||||
#include "HW/Memmap.h"
|
#include "HW/Memmap.h"
|
||||||
|
#include "PerfQueryBase.h"
|
||||||
|
|
||||||
using namespace BPFunctions;
|
using namespace BPFunctions;
|
||||||
|
|
||||||
|
@ -62,7 +63,6 @@ void RenderToXFB(const BPCmd &bp, const EFBRectangle &rc, float yScale, float xf
|
||||||
{
|
{
|
||||||
Renderer::RenderToXFB(xfbAddr, dstWidth, dstHeight, rc, gamma);
|
Renderer::RenderToXFB(xfbAddr, dstWidth, dstHeight, rc, gamma);
|
||||||
}
|
}
|
||||||
|
|
||||||
void BPWritten(const BPCmd& bp)
|
void BPWritten(const BPCmd& bp)
|
||||||
{
|
{
|
||||||
/*
|
/*
|
||||||
|
@ -144,7 +144,8 @@ void BPWritten(const BPCmd& bp)
|
||||||
|| bp.address == BPMEM_LOADTLUT0
|
|| bp.address == BPMEM_LOADTLUT0
|
||||||
|| bp.address == BPMEM_LOADTLUT1
|
|| bp.address == BPMEM_LOADTLUT1
|
||||||
|| bp.address == BPMEM_TEXINVALIDATE
|
|| bp.address == BPMEM_TEXINVALIDATE
|
||||||
|| bp.address == BPMEM_PRELOAD_MODE))
|
|| bp.address == BPMEM_PRELOAD_MODE
|
||||||
|
|| bp.address == BPMEM_CLEAR_PIXEL_PERF))
|
||||||
{
|
{
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
@ -484,9 +485,10 @@ void BPWritten(const BPCmd& bp)
|
||||||
case BPMEM_IND_IMASK: // Index Mask ?
|
case BPMEM_IND_IMASK: // Index Mask ?
|
||||||
case BPMEM_REVBITS: // Always set to 0x0F when GX_InitRevBits() is called.
|
case BPMEM_REVBITS: // Always set to 0x0F when GX_InitRevBits() is called.
|
||||||
break;
|
break;
|
||||||
|
|
||||||
case BPMEM_UNKNOWN_57: // Sunshine alternates this register between values 0x000 and 0xAAA
|
case BPMEM_CLEAR_PIXEL_PERF:
|
||||||
DEBUG_LOG(VIDEO, "Unknown BP Reg 0x57: %08x", bp.newvalue);
|
// GXClearPixMetric writes 0xAAA here, Sunshine alternates this register between values 0x000 and 0xAAA
|
||||||
|
g_perf_query->ResetQuery();
|
||||||
break;
|
break;
|
||||||
|
|
||||||
case BPMEM_PRELOAD_ADDR:
|
case BPMEM_PRELOAD_ADDR:
|
||||||
|
|
|
@ -21,6 +21,10 @@ volatile u32 s_swapRequested = false;
|
||||||
u32 s_efbAccessRequested = false;
|
u32 s_efbAccessRequested = false;
|
||||||
volatile u32 s_FifoShuttingDown = false;
|
volatile u32 s_FifoShuttingDown = false;
|
||||||
|
|
||||||
|
std::condition_variable s_perf_query_cond;
|
||||||
|
std::mutex s_perf_query_lock;
|
||||||
|
static volatile bool s_perf_query_requested;
|
||||||
|
|
||||||
static volatile struct
|
static volatile struct
|
||||||
{
|
{
|
||||||
u32 xfbAddr;
|
u32 xfbAddr;
|
||||||
|
@ -169,6 +173,43 @@ u32 VideoBackendHardware::Video_AccessEFB(EFBAccessType type, u32 x, u32 y, u32
|
||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static bool QueryResultIsReady()
|
||||||
|
{
|
||||||
|
return !s_perf_query_requested || s_FifoShuttingDown;
|
||||||
|
}
|
||||||
|
|
||||||
|
void VideoFifo_CheckPerfQueryRequest()
|
||||||
|
{
|
||||||
|
if (s_perf_query_requested)
|
||||||
|
{
|
||||||
|
g_perf_query->FlushResults();
|
||||||
|
|
||||||
|
{
|
||||||
|
std::lock_guard<std::mutex> lk(s_perf_query_lock);
|
||||||
|
s_perf_query_requested = false;
|
||||||
|
}
|
||||||
|
|
||||||
|
s_perf_query_cond.notify_one();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
u32 VideoBackendHardware::Video_GetQueryResult(PerfQueryType type)
|
||||||
|
{
|
||||||
|
// TODO: Is this check sane?
|
||||||
|
if (!g_perf_query->IsFlushed())
|
||||||
|
{
|
||||||
|
if (SConfig::GetInstance().m_LocalCoreStartupParameter.bCPUThread)
|
||||||
|
{
|
||||||
|
s_perf_query_requested = true;
|
||||||
|
std::unique_lock<std::mutex> lk(s_perf_query_lock);
|
||||||
|
s_perf_query_cond.wait(lk, QueryResultIsReady);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
g_perf_query->FlushResults();
|
||||||
|
}
|
||||||
|
|
||||||
|
return g_perf_query->GetQueryResult(type);
|
||||||
|
}
|
||||||
|
|
||||||
void VideoBackendHardware::InitializeShared()
|
void VideoBackendHardware::InitializeShared()
|
||||||
{
|
{
|
||||||
|
@ -176,6 +217,7 @@ void VideoBackendHardware::InitializeShared()
|
||||||
|
|
||||||
s_swapRequested = 0;
|
s_swapRequested = 0;
|
||||||
s_efbAccessRequested = 0;
|
s_efbAccessRequested = 0;
|
||||||
|
s_perf_query_requested = false;
|
||||||
s_FifoShuttingDown = 0;
|
s_FifoShuttingDown = 0;
|
||||||
memset((void*)&s_beginFieldArgs, 0, sizeof(s_beginFieldArgs));
|
memset((void*)&s_beginFieldArgs, 0, sizeof(s_beginFieldArgs));
|
||||||
memset(&s_accessEFBArgs, 0, sizeof(s_accessEFBArgs));
|
memset(&s_accessEFBArgs, 0, sizeof(s_accessEFBArgs));
|
||||||
|
@ -186,6 +228,11 @@ void VideoBackendHardware::InitializeShared()
|
||||||
// Run from the CPU thread
|
// Run from the CPU thread
|
||||||
void VideoBackendHardware::DoState(PointerWrap& p)
|
void VideoBackendHardware::DoState(PointerWrap& p)
|
||||||
{
|
{
|
||||||
|
bool software = false;
|
||||||
|
p.Do(software);
|
||||||
|
if (p.GetMode() == PointerWrap::MODE_READ && software == true)
|
||||||
|
// change mode to abort load of incompatible save state.
|
||||||
|
p.SetMode(PointerWrap::MODE_VERIFY);
|
||||||
VideoCommon_DoState(p);
|
VideoCommon_DoState(p);
|
||||||
p.DoMarker("VideoCommon");
|
p.DoMarker("VideoCommon");
|
||||||
|
|
||||||
|
@ -233,6 +280,7 @@ void VideoFifo_CheckAsyncRequest()
|
||||||
{
|
{
|
||||||
VideoFifo_CheckSwapRequest();
|
VideoFifo_CheckSwapRequest();
|
||||||
VideoFifo_CheckEFBAccess();
|
VideoFifo_CheckEFBAccess();
|
||||||
|
VideoFifo_CheckPerfQueryRequest();
|
||||||
}
|
}
|
||||||
|
|
||||||
void VideoBackendHardware::Video_GatherPipeBursted()
|
void VideoBackendHardware::Video_GatherPipeBursted()
|
||||||
|
|
|
@ -22,7 +22,7 @@ namespace OSD
|
||||||
{
|
{
|
||||||
|
|
||||||
// On-screen message display
|
// On-screen message display
|
||||||
void AddMessage(const char* str, u32 ms);
|
void AddMessage(const char* str, u32 ms = 2000);
|
||||||
void DrawMessages(); // draw the current messages on the screen. Only call once per frame.
|
void DrawMessages(); // draw the current messages on the screen. Only call once per frame.
|
||||||
void ClearMessages();
|
void ClearMessages();
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,3 @@
|
||||||
|
#include "PerfQueryBase.h"
|
||||||
|
|
||||||
|
PerfQueryBase* g_perf_query = 0;
|
|
@ -0,0 +1,54 @@
|
||||||
|
#ifndef _PERFQUERY_BASE_H_
|
||||||
|
#define _PERFQUERY_BASE_H_
|
||||||
|
|
||||||
|
#include "CommonTypes.h"
|
||||||
|
|
||||||
|
enum PerfQueryType
|
||||||
|
{
|
||||||
|
PQ_ZCOMP_INPUT_ZCOMPLOC = 0,
|
||||||
|
PQ_ZCOMP_OUTPUT_ZCOMPLOC,
|
||||||
|
PQ_ZCOMP_INPUT,
|
||||||
|
PQ_ZCOMP_OUTPUT,
|
||||||
|
PQ_BLEND_INPUT,
|
||||||
|
PQ_EFB_COPY_CLOCKS,
|
||||||
|
PQ_NUM_MEMBERS
|
||||||
|
};
|
||||||
|
|
||||||
|
// Groups of counters that are enabled/disabled together via
// EnableQuery()/DisableQuery(). Values are consecutive, starting at zero.
enum PerfQueryGroup
{
	PQG_ZCOMP_ZCOMPLOC  = 0,
	PQG_ZCOMP           = 1,
	PQG_EFB_COPY_CLOCKS = 2,
	PQG_NUM_MEMBERS     = 3  // count of the groups listed above
};
|
||||||
|
|
||||||
|
class PerfQueryBase
|
||||||
|
{
|
||||||
|
public:
|
||||||
|
PerfQueryBase() {};
|
||||||
|
virtual ~PerfQueryBase() {}
|
||||||
|
|
||||||
|
// Begin querying the specified value for the following host GPU commands
|
||||||
|
virtual void EnableQuery(PerfQueryGroup type) {}
|
||||||
|
|
||||||
|
// Stop querying the specified value for the following host GPU commands
|
||||||
|
virtual void DisableQuery(PerfQueryGroup type) {}
|
||||||
|
|
||||||
|
// Reset query counters to zero and drop any pending queries
|
||||||
|
virtual void ResetQuery() {}
|
||||||
|
|
||||||
|
// Return the measured value for the specified query type
|
||||||
|
// NOTE: Called from CPU thread
|
||||||
|
virtual u32 GetQueryResult(PerfQueryType type) { return 0; }
|
||||||
|
|
||||||
|
// Request the value of any pending queries - causes a pipeline flush and thus should be used carefully!
|
||||||
|
virtual void FlushResults() {}
|
||||||
|
|
||||||
|
// True if there are no further pending query results
|
||||||
|
// NOTE: Called from CPU thread
|
||||||
|
virtual bool IsFlushed() const { return true; }
|
||||||
|
};
|
||||||
|
|
||||||
|
extern PerfQueryBase* g_perf_query;
|
||||||
|
|
||||||
|
#endif // _PERFQUERY_BASE_H_
|
|
@ -28,10 +28,13 @@
|
||||||
#include "ConfigManager.h"
|
#include "ConfigManager.h"
|
||||||
|
|
||||||
#include "PixelEngine.h"
|
#include "PixelEngine.h"
|
||||||
|
#include "RenderBase.h"
|
||||||
#include "CommandProcessor.h"
|
#include "CommandProcessor.h"
|
||||||
#include "HW/ProcessorInterface.h"
|
#include "HW/ProcessorInterface.h"
|
||||||
#include "DLCache.h"
|
#include "DLCache.h"
|
||||||
#include "State.h"
|
#include "State.h"
|
||||||
|
#include "PerfQueryBase.h"
|
||||||
|
|
||||||
namespace PixelEngine
|
namespace PixelEngine
|
||||||
{
|
{
|
||||||
|
|
||||||
|
@ -255,23 +258,59 @@ void Read16(u16& _uReturnValue, const u32 _iAddress)
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
case PE_PERF_0L:
|
// NOTE(neobrain): only PE_PERF_ZCOMP_OUTPUT is implemented in D3D11, but the other values shouldn't contradict the value of that register (i.e. INPUT registers should always be greater than or equal to their corresponding OUTPUT registers).
|
||||||
case PE_PERF_0H:
|
case PE_PERF_ZCOMP_INPUT_ZCOMPLOC_L:
|
||||||
case PE_PERF_1L:
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_ZCOMP_INPUT_ZCOMPLOC) & 0xFFFF;
|
||||||
case PE_PERF_1H:
|
break;
|
||||||
case PE_PERF_2L:
|
|
||||||
case PE_PERF_2H:
|
case PE_PERF_ZCOMP_INPUT_ZCOMPLOC_H:
|
||||||
case PE_PERF_3L:
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_ZCOMP_INPUT_ZCOMPLOC) >> 16;
|
||||||
case PE_PERF_3H:
|
break;
|
||||||
case PE_PERF_4L:
|
|
||||||
case PE_PERF_4H:
|
case PE_PERF_ZCOMP_OUTPUT_ZCOMPLOC_L:
|
||||||
case PE_PERF_5L:
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_ZCOMP_OUTPUT_ZCOMPLOC) & 0xFFFF;
|
||||||
case PE_PERF_5H:
|
break;
|
||||||
INFO_LOG(PIXELENGINE, "(r16) perf counter @ %08x", _iAddress);
|
|
||||||
// git r90a2096a24f4 (svn r3663) added the PE_PERF cases, without setting
|
case PE_PERF_ZCOMP_OUTPUT_ZCOMPLOC_H:
|
||||||
// _uReturnValue to anything, this reverts to the previous behaviour which allows
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_ZCOMP_OUTPUT_ZCOMPLOC) >> 16;
|
||||||
// The timer in SMS:Scrubbing Serena Beach to countdown correctly
|
break;
|
||||||
_uReturnValue = 1;
|
|
||||||
|
case PE_PERF_ZCOMP_INPUT_L:
|
||||||
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_ZCOMP_INPUT) & 0xFFFF;
|
||||||
|
break;
|
||||||
|
|
||||||
|
case PE_PERF_ZCOMP_INPUT_H:
|
||||||
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_ZCOMP_INPUT) >> 16;
|
||||||
|
break;
|
||||||
|
|
||||||
|
case PE_PERF_ZCOMP_OUTPUT_L:
|
||||||
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_ZCOMP_OUTPUT) & 0xFFFF;
|
||||||
|
break;
|
||||||
|
|
||||||
|
case PE_PERF_ZCOMP_OUTPUT_H:
|
||||||
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_ZCOMP_OUTPUT) >> 16;
|
||||||
|
break;
|
||||||
|
|
||||||
|
case PE_PERF_BLEND_INPUT_L:
|
||||||
|
// Super Mario Sunshine uses this register in episode 6 of Sirena Beach:
|
||||||
|
// The amount of remaining goop is determined by checking how many pixels reach the blending stage.
|
||||||
|
// Once this register falls below a particular value (around 0x90), the game regards the challenge finished.
|
||||||
|
// In very old builds, Dolphin only returned 0. That caused the challenge to be immediately finished without any goop being cleaned (the timer just didn't even start counting from 3:00:00).
|
||||||
|
// Later builds returned 1 for the high register. That caused the timer to actually count down, but made the challenge unbeatable because the game always thought you didn't clear any goop at all.
|
||||||
|
// Note that currently this functionality is only implemented in the D3D11 backend.
|
||||||
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_BLEND_INPUT) & 0xFFFF;
|
||||||
|
break;
|
||||||
|
|
||||||
|
case PE_PERF_BLEND_INPUT_H:
|
||||||
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_BLEND_INPUT) >> 16;
|
||||||
|
break;
|
||||||
|
|
||||||
|
case PE_PERF_EFB_COPY_CLOCKS_L:
|
||||||
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_EFB_COPY_CLOCKS) & 0xFFFF;
|
||||||
|
break;
|
||||||
|
|
||||||
|
case PE_PERF_EFB_COPY_CLOCKS_H:
|
||||||
|
_uReturnValue = g_video_backend->Video_GetQueryResult(PQ_EFB_COPY_CLOCKS) >> 16;
|
||||||
break;
|
break;
|
||||||
|
|
||||||
default:
|
default:
|
||||||
|
|
|
@ -36,19 +36,20 @@ enum
|
||||||
PE_BBOX_TOP = 0x14, // Flip Top
|
PE_BBOX_TOP = 0x14, // Flip Top
|
||||||
PE_BBOX_BOTTOM = 0x16, // Flip Bottom
|
PE_BBOX_BOTTOM = 0x16, // Flip Bottom
|
||||||
|
|
||||||
// These have not yet been RE:d. They are the perf counters.
|
// NOTE: Order not verified
|
||||||
PE_PERF_0L = 0x18,
|
// These indicate the number of quads that are being used as input/output for each particular stage
|
||||||
PE_PERF_0H = 0x1a,
|
PE_PERF_ZCOMP_INPUT_ZCOMPLOC_L = 0x18,
|
||||||
PE_PERF_1L = 0x1c,
|
PE_PERF_ZCOMP_INPUT_ZCOMPLOC_H = 0x1a,
|
||||||
PE_PERF_1H = 0x1e,
|
PE_PERF_ZCOMP_OUTPUT_ZCOMPLOC_L = 0x1c,
|
||||||
PE_PERF_2L = 0x20,
|
PE_PERF_ZCOMP_OUTPUT_ZCOMPLOC_H = 0x1e,
|
||||||
PE_PERF_2H = 0x22,
|
PE_PERF_ZCOMP_INPUT_L = 0x20,
|
||||||
PE_PERF_3L = 0x24,
|
PE_PERF_ZCOMP_INPUT_H = 0x22,
|
||||||
PE_PERF_3H = 0x26,
|
PE_PERF_ZCOMP_OUTPUT_L = 0x24,
|
||||||
PE_PERF_4L = 0x28,
|
PE_PERF_ZCOMP_OUTPUT_H = 0x26,
|
||||||
PE_PERF_4H = 0x2a,
|
PE_PERF_BLEND_INPUT_L = 0x28,
|
||||||
PE_PERF_5L = 0x2c,
|
PE_PERF_BLEND_INPUT_H = 0x2a,
|
||||||
PE_PERF_5H = 0x2e,
|
PE_PERF_EFB_COPY_CLOCKS_L = 0x2c,
|
||||||
|
PE_PERF_EFB_COPY_CLOCKS_H = 0x2e,
|
||||||
};
|
};
|
||||||
|
|
||||||
namespace PixelEngine
|
namespace PixelEngine
|
||||||
|
|
|
@ -52,6 +52,15 @@ public:
|
||||||
Renderer();
|
Renderer();
|
||||||
virtual ~Renderer();
|
virtual ~Renderer();
|
||||||
|
|
||||||
|
enum PixelPerfQuery {
|
||||||
|
PP_ZCOMP_INPUT_ZCOMPLOC,
|
||||||
|
PP_ZCOMP_OUTPUT_ZCOMPLOC,
|
||||||
|
PP_ZCOMP_INPUT,
|
||||||
|
PP_ZCOMP_OUTPUT,
|
||||||
|
PP_BLEND_INPUT,
|
||||||
|
PP_EFB_COPY_CLOCKS
|
||||||
|
};
|
||||||
|
|
||||||
virtual void SetColorMask() = 0;
|
virtual void SetColorMask() = 0;
|
||||||
virtual void SetBlendMode(bool forceUpdate) = 0;
|
virtual void SetBlendMode(bool forceUpdate) = 0;
|
||||||
virtual void SetScissorRect(const TargetRectangle& rc) = 0;
|
virtual void SetScissorRect(const TargetRectangle& rc) = 0;
|
||||||
|
|
|
@ -132,8 +132,7 @@ void TextureCache::Cleanup()
|
||||||
if ( frameCount > TEXTURE_KILL_THRESHOLD + iter->second->frameCount
|
if ( frameCount > TEXTURE_KILL_THRESHOLD + iter->second->frameCount
|
||||||
|
|
||||||
// EFB copies living on the host GPU are unrecoverable and thus shouldn't be deleted
|
// EFB copies living on the host GPU are unrecoverable and thus shouldn't be deleted
|
||||||
// TODO: encoding the texture back to RAM here might be a good idea
|
&& ! iter->second->IsEfbCopy() )
|
||||||
&& ! (g_ActiveConfig.bCopyEFBToTexture && iter->second->IsEfbCopy()) )
|
|
||||||
{
|
{
|
||||||
delete iter->second;
|
delete iter->second;
|
||||||
textures.erase(iter++);
|
textures.erase(iter++);
|
||||||
|
|
|
@ -257,7 +257,9 @@ void VertexManager::Flush()
|
||||||
//if (g_nativeVertexFmt)
|
//if (g_nativeVertexFmt)
|
||||||
g_nativeVertexFmt->SetupVertexPointers();
|
g_nativeVertexFmt->SetupVertexPointers();
|
||||||
|
|
||||||
|
g_renderer->ResumePixelPerf(false);
|
||||||
g_vertex_manager->Draw(stride, false);
|
g_vertex_manager->Draw(stride, false);
|
||||||
|
g_renderer->PausePixelPerf(false);
|
||||||
|
|
||||||
// run through vertex groups again to set alpha
|
// run through vertex groups again to set alpha
|
||||||
if (false == g_ActiveConfig.bDstAlphaPass && bpmem.dstalpha.enable && bpmem.blendmode.alphaupdate)
|
if (false == g_ActiveConfig.bDstAlphaPass && bpmem.dstalpha.enable && bpmem.blendmode.alphaupdate)
|
||||||
|
|
|
@ -115,7 +115,7 @@ struct VideoConfig
|
||||||
int iAnaglyphStereoSeparation;
|
int iAnaglyphStereoSeparation;
|
||||||
int iAnaglyphFocalAngle;
|
int iAnaglyphFocalAngle;
|
||||||
bool b3DVision;
|
bool b3DVision;
|
||||||
|
|
||||||
// Hacks
|
// Hacks
|
||||||
bool bEFBAccessEnable;
|
bool bEFBAccessEnable;
|
||||||
bool bDlistCachingEnable;
|
bool bDlistCachingEnable;
|
||||||
|
|
|
@ -196,6 +196,7 @@
|
||||||
<ClCompile Include="Src\OpcodeDecoding.cpp" />
|
<ClCompile Include="Src\OpcodeDecoding.cpp" />
|
||||||
<ClCompile Include="Src\OpenCL.cpp" />
|
<ClCompile Include="Src\OpenCL.cpp" />
|
||||||
<ClCompile Include="Src\OpenCL\OCLTextureDecoder.cpp" />
|
<ClCompile Include="Src\OpenCL\OCLTextureDecoder.cpp" />
|
||||||
|
<ClCompile Include="Src\PerfQueryBase.cpp" />
|
||||||
<ClCompile Include="Src\PixelEngine.cpp" />
|
<ClCompile Include="Src\PixelEngine.cpp" />
|
||||||
<ClCompile Include="Src\PixelShaderGen.cpp" />
|
<ClCompile Include="Src\PixelShaderGen.cpp" />
|
||||||
<ClCompile Include="Src\PixelShaderManager.cpp" />
|
<ClCompile Include="Src\PixelShaderManager.cpp" />
|
||||||
|
@ -244,6 +245,7 @@
|
||||||
<ClInclude Include="Src\OpcodeDecoding.h" />
|
<ClInclude Include="Src\OpcodeDecoding.h" />
|
||||||
<ClInclude Include="Src\OpenCL.h" />
|
<ClInclude Include="Src\OpenCL.h" />
|
||||||
<ClInclude Include="Src\OpenCL\OCLTextureDecoder.h" />
|
<ClInclude Include="Src\OpenCL\OCLTextureDecoder.h" />
|
||||||
|
<ClInclude Include="Src\PerfQueryBase.h" />
|
||||||
<ClInclude Include="Src\PixelEngine.h" />
|
<ClInclude Include="Src\PixelEngine.h" />
|
||||||
<ClInclude Include="Src\PixelShaderGen.h" />
|
<ClInclude Include="Src\PixelShaderGen.h" />
|
||||||
<ClInclude Include="Src\PixelShaderManager.h" />
|
<ClInclude Include="Src\PixelShaderManager.h" />
|
||||||
|
|
|
@ -101,6 +101,9 @@
|
||||||
<ClCompile Include="Src\MainBase.cpp">
|
<ClCompile Include="Src\MainBase.cpp">
|
||||||
<Filter>Base</Filter>
|
<Filter>Base</Filter>
|
||||||
</ClCompile>
|
</ClCompile>
|
||||||
|
<ClCompile Include="Src\PerfQueryBase.cpp">
|
||||||
|
<Filter>Base</Filter>
|
||||||
|
</ClCompile>
|
||||||
<ClCompile Include="Src\RenderBase.cpp">
|
<ClCompile Include="Src\RenderBase.cpp">
|
||||||
<Filter>Base</Filter>
|
<Filter>Base</Filter>
|
||||||
</ClCompile>
|
</ClCompile>
|
||||||
|
@ -237,6 +240,9 @@
|
||||||
<ClInclude Include="Src\MainBase.h">
|
<ClInclude Include="Src\MainBase.h">
|
||||||
<Filter>Base</Filter>
|
<Filter>Base</Filter>
|
||||||
</ClInclude>
|
</ClInclude>
|
||||||
|
<ClInclude Include="Src\PerfQueryBase.h">
|
||||||
|
<Filter>Base</Filter>
|
||||||
|
</ClInclude>
|
||||||
<ClInclude Include="Src\RenderBase.h">
|
<ClInclude Include="Src\RenderBase.h">
|
||||||
<Filter>Base</Filter>
|
<Filter>Base</Filter>
|
||||||
</ClInclude>
|
</ClInclude>
|
||||||
|
@ -285,4 +291,4 @@
|
||||||
<UniqueIdentifier>{e2a527a2-ccc8-4ab8-a93e-dd2628c0f3b6}</UniqueIdentifier>
|
<UniqueIdentifier>{e2a527a2-ccc8-4ab8-a93e-dd2628c0f3b6}</UniqueIdentifier>
|
||||||
</Filter>
|
</Filter>
|
||||||
</ItemGroup>
|
</ItemGroup>
|
||||||
</Project>
|
</Project>
|
||||||
|
|
|
@ -199,6 +199,7 @@
|
||||||
<ClCompile Include="Src\LineGeometryShader.cpp" />
|
<ClCompile Include="Src\LineGeometryShader.cpp" />
|
||||||
<ClCompile Include="Src\main.cpp" />
|
<ClCompile Include="Src\main.cpp" />
|
||||||
<ClCompile Include="Src\NativeVertexFormat.cpp" />
|
<ClCompile Include="Src\NativeVertexFormat.cpp" />
|
||||||
|
<ClCompile Include="Src\PerfQuery.cpp" />
|
||||||
<ClCompile Include="Src\PixelShaderCache.cpp" />
|
<ClCompile Include="Src\PixelShaderCache.cpp" />
|
||||||
<ClCompile Include="Src\PointGeometryShader.cpp" />
|
<ClCompile Include="Src\PointGeometryShader.cpp" />
|
||||||
<ClCompile Include="Src\PSTextureEncoder.cpp" />
|
<ClCompile Include="Src\PSTextureEncoder.cpp" />
|
||||||
|
@ -228,6 +229,7 @@
|
||||||
<ClInclude Include="Src\Globals.h" />
|
<ClInclude Include="Src\Globals.h" />
|
||||||
<ClInclude Include="Src\LineGeometryShader.h" />
|
<ClInclude Include="Src\LineGeometryShader.h" />
|
||||||
<ClInclude Include="Src\main.h" />
|
<ClInclude Include="Src\main.h" />
|
||||||
|
<ClInclude Include="Src\PerfQuery.h" />
|
||||||
<ClInclude Include="Src\PixelShaderCache.h" />
|
<ClInclude Include="Src\PixelShaderCache.h" />
|
||||||
<ClInclude Include="Src\PointGeometryShader.h" />
|
<ClInclude Include="Src\PointGeometryShader.h" />
|
||||||
<ClInclude Include="Src\PSTextureEncoder.h" />
|
<ClInclude Include="Src\PSTextureEncoder.h" />
|
||||||
|
|
|
@ -57,6 +57,9 @@
|
||||||
<ClCompile Include="Src\PointGeometryShader.cpp">
|
<ClCompile Include="Src\PointGeometryShader.cpp">
|
||||||
<Filter>Render</Filter>
|
<Filter>Render</Filter>
|
||||||
</ClCompile>
|
</ClCompile>
|
||||||
|
<ClCompile Include="Src\PerfQuery.cpp">
|
||||||
|
<Filter>Render</Filter>
|
||||||
|
</ClCompile>
|
||||||
</ItemGroup>
|
</ItemGroup>
|
||||||
<ItemGroup>
|
<ItemGroup>
|
||||||
<ClInclude Include="Src\Globals.h" />
|
<ClInclude Include="Src\Globals.h" />
|
||||||
|
@ -117,6 +120,9 @@
|
||||||
<ClInclude Include="Src\PointGeometryShader.h">
|
<ClInclude Include="Src\PointGeometryShader.h">
|
||||||
<Filter>Render</Filter>
|
<Filter>Render</Filter>
|
||||||
</ClInclude>
|
</ClInclude>
|
||||||
|
<ClInclude Include="Src\PerfQuery.h">
|
||||||
|
<Filter>Render</Filter>
|
||||||
|
</ClInclude>
|
||||||
</ItemGroup>
|
</ItemGroup>
|
||||||
<ItemGroup>
|
<ItemGroup>
|
||||||
<Filter Include="D3D">
|
<Filter Include="D3D">
|
||||||
|
|
|
@ -0,0 +1,150 @@
|
||||||
|
#include "RenderBase.h"
|
||||||
|
|
||||||
|
#include "D3DBase.h"
|
||||||
|
#include "PerfQuery.h"
|
||||||
|
|
||||||
|
namespace DX11 {
|
||||||
|
|
||||||
|
// Creates one occlusion query object per ring-buffer slot and clears the
// accumulated counters. A failed creation is logged and leaves that slot's
// query pointer NULL.
PerfQuery::PerfQuery()
	: m_query_read_pos()
	, m_query_count()
{
	// The description is the same for every slot, so build it only once.
	const D3D11_QUERY_DESC qdesc = CD3D11_QUERY_DESC(D3D11_QUERY_OCCLUSION, 0);

	for (int i = 0; i != ARRAYSIZE(m_query_buffer); ++i)
	{
		// Start from a known value so a failed creation never leaves a garbage pointer behind.
		m_query_buffer[i].query = NULL;

		const HRESULT hr = D3D::device->CreateQuery(&qdesc, &m_query_buffer[i].query);
		if (FAILED(hr))
			ERROR_LOG(VIDEO, "failed to create occlusion query %d (hr=0x%08x)", i, (unsigned int)hr);
	}
	ResetQuery();
}

// Releases every query object that was successfully created.
PerfQuery::~PerfQuery()
{
	for (int i = 0; i != ARRAYSIZE(m_query_buffer); ++i)
	{
		// TODO: EndQuery?
		if (m_query_buffer[i].query != NULL)
			m_query_buffer[i].query->Release();
	}
}
|
||||||
|
|
||||||
|
// Starts an occlusion query in the next free ring-buffer slot.
// Only the PQG_ZCOMP_ZCOMPLOC and PQG_ZCOMP groups start a query; the buffer
// housekeeping at the top runs for every group.
void PerfQuery::EnableQuery(PerfQueryGroup type)
{
	// Is this sane?
	const bool more_than_half_full = m_query_count > ARRAYSIZE(m_query_buffer) / 2;
	if (more_than_half_full)
		WeakFlush();

	// If the opportunistic flush could not free anything, force one slot free.
	const bool buffer_full = (ARRAYSIZE(m_query_buffer) == m_query_count);
	if (buffer_full)
	{
		// TODO
		FlushOne();
		ERROR_LOG(VIDEO, "flushed query buffer early!");
	}

	if (type != PQG_ZCOMP_ZCOMPLOC && type != PQG_ZCOMP)
		return;

	// start query
	ActiveQuery& slot = m_query_buffer[(m_query_read_pos + m_query_count) % ARRAYSIZE(m_query_buffer)];

	D3D::context->Begin(slot.query);
	slot.query_type = type;

	++m_query_count;
}
|
||||||
|
|
||||||
|
// Ends the most recently started occlusion query.
// Groups other than PQG_ZCOMP_ZCOMPLOC and PQG_ZCOMP are ignored.
void PerfQuery::DisableQuery(PerfQueryGroup type)
{
	if (type != PQG_ZCOMP_ZCOMPLOC && type != PQG_ZCOMP)
		return;

	// stop query
	// The newest entry sits one slot before the next free one; the buffer size
	// is added before subtracting so the index stays non-negative.
	ActiveQuery& newest = m_query_buffer[(m_query_read_pos + m_query_count + ARRAYSIZE(m_query_buffer)-1) % ARRAYSIZE(m_query_buffer)];
	D3D::context->End(newest.query);
}
|
||||||
|
|
||||||
|
void PerfQuery::ResetQuery()
|
||||||
|
{
|
||||||
|
m_query_count = 0;
|
||||||
|
std::fill_n(m_results, ARRAYSIZE(m_results), 0);
|
||||||
|
}
|
||||||
|
|
||||||
|
// Maps a counter type onto the accumulated per-group results.
// Returns the selected total divided by 4; unknown types yield 0.
// NOTE(review): the division by 4 presumably converts pixels into quads - confirm.
u32 PerfQuery::GetQueryResult(PerfQueryType type)
{
	u32 total = 0;

	switch (type)
	{
	case PQ_ZCOMP_INPUT_ZCOMPLOC:
	case PQ_ZCOMP_OUTPUT_ZCOMPLOC:
		total = m_results[PQG_ZCOMP_ZCOMPLOC];
		break;

	case PQ_ZCOMP_INPUT:
	case PQ_ZCOMP_OUTPUT:
		total = m_results[PQG_ZCOMP];
		break;

	case PQ_BLEND_INPUT:
		// Sum of both z-compare groups.
		total = m_results[PQG_ZCOMP] + m_results[PQG_ZCOMP_ZCOMPLOC];
		break;

	case PQ_EFB_COPY_CLOCKS:
		total = m_results[PQG_EFB_COPY_CLOCKS];
		break;

	default:
		break;
	}

	return total / 4;
}
|
||||||
|
|
||||||
|
void PerfQuery::FlushOne()
|
||||||
|
{
|
||||||
|
auto& entry = m_query_buffer[m_query_read_pos];
|
||||||
|
|
||||||
|
UINT64 result = 0;
|
||||||
|
HRESULT hr = S_FALSE;
|
||||||
|
while (hr != S_OK)
|
||||||
|
{
|
||||||
|
// TODO: Might cause us to be stuck in an infinite loop!
|
||||||
|
hr = D3D::context->GetData(entry.query, &result, sizeof(result), 0);
|
||||||
|
}
|
||||||
|
|
||||||
|
// NOTE: Reported pixel metrics should be referenced to native resolution
|
||||||
|
m_results[entry.query_type] += (u64)result * EFB_WIDTH / g_renderer->GetTargetWidth() * EFB_HEIGHT / g_renderer->GetTargetHeight();
|
||||||
|
|
||||||
|
m_query_read_pos = (m_query_read_pos + 1) % ARRAYSIZE(m_query_buffer);
|
||||||
|
--m_query_count;
|
||||||
|
}
|
||||||
|
|
||||||
|
// TODO: could selectively flush things, but I don't think that will do much
|
||||||
|
void PerfQuery::FlushResults()
|
||||||
|
{
|
||||||
|
while (!IsFlushed())
|
||||||
|
FlushOne();
|
||||||
|
}
|
||||||
|
|
||||||
|
void PerfQuery::WeakFlush()
|
||||||
|
{
|
||||||
|
while (!IsFlushed())
|
||||||
|
{
|
||||||
|
auto& entry = m_query_buffer[m_query_read_pos];
|
||||||
|
|
||||||
|
UINT64 result = 0;
|
||||||
|
HRESULT hr = D3D::context->GetData(entry.query, &result, sizeof(result), D3D11_ASYNC_GETDATA_DONOTFLUSH);
|
||||||
|
|
||||||
|
if (hr == S_OK)
|
||||||
|
{
|
||||||
|
// NOTE: Reported pixel metrics should be referenced to native resolution
|
||||||
|
m_results[entry.query_type] += (u64)result * EFB_WIDTH / g_renderer->GetTargetWidth() * EFB_HEIGHT / g_renderer->GetTargetHeight();
|
||||||
|
|
||||||
|
m_query_read_pos = (m_query_read_pos + 1) % ARRAYSIZE(m_query_buffer);
|
||||||
|
--m_query_count;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
bool PerfQuery::IsFlushed() const
|
||||||
|
{
|
||||||
|
return 0 == m_query_count;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
} // namespace
|
|
@ -0,0 +1,46 @@
|
||||||
|
#ifndef _PERFQUERY_H_
|
||||||
|
#define _PERFQUERY_H_
|
||||||
|
|
||||||
|
#include "PerfQueryBase.h"
|
||||||
|
|
||||||
|
namespace DX11 {
|
||||||
|
|
||||||
|
class PerfQuery : public PerfQueryBase
|
||||||
|
{
|
||||||
|
public:
|
||||||
|
PerfQuery();
|
||||||
|
~PerfQuery();
|
||||||
|
|
||||||
|
void EnableQuery(PerfQueryGroup type);
|
||||||
|
void DisableQuery(PerfQueryGroup type);
|
||||||
|
void ResetQuery();
|
||||||
|
u32 GetQueryResult(PerfQueryType type);
|
||||||
|
void FlushResults();
|
||||||
|
bool IsFlushed() const;
|
||||||
|
|
||||||
|
private:
|
||||||
|
struct ActiveQuery
|
||||||
|
{
|
||||||
|
ID3D11Query* query;
|
||||||
|
PerfQueryGroup query_type;
|
||||||
|
};
|
||||||
|
|
||||||
|
void WeakFlush();
|
||||||
|
|
||||||
|
// Only use when non-empty
|
||||||
|
void FlushOne();
|
||||||
|
|
||||||
|
// when testing in SMS: 64 was too small, 128 was ok
|
||||||
|
static const int PERF_QUERY_BUFFER_SIZE = 512;
|
||||||
|
|
||||||
|
ActiveQuery m_query_buffer[PERF_QUERY_BUFFER_SIZE];
|
||||||
|
int m_query_read_pos;
|
||||||
|
|
||||||
|
// TODO: sloppy
|
||||||
|
volatile int m_query_count;
|
||||||
|
volatile u32 m_results[PQG_NUM_MEMBERS];
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace
|
||||||
|
|
||||||
|
#endif // _PERFQUERY_H_
|
|
@ -65,6 +65,7 @@ ID3D11RasterizerState* resetraststate = NULL;
|
||||||
|
|
||||||
static ID3D11Texture2D* s_screenshot_texture = NULL;
|
static ID3D11Texture2D* s_screenshot_texture = NULL;
|
||||||
|
|
||||||
|
|
||||||
// GX pipeline state
|
// GX pipeline state
|
||||||
struct
|
struct
|
||||||
{
|
{
|
||||||
|
|
|
@ -208,7 +208,6 @@ void VertexManager::Draw(UINT stride)
|
||||||
if (IndexGenerator::GetNumLines() > 0 || IndexGenerator::GetNumPoints() > 0)
|
if (IndexGenerator::GetNumLines() > 0 || IndexGenerator::GetNumPoints() > 0)
|
||||||
((DX11::Renderer*)g_renderer)->RestoreCull();
|
((DX11::Renderer*)g_renderer)->RestoreCull();
|
||||||
}
|
}
|
||||||
|
|
||||||
void VertexManager::vFlush()
|
void VertexManager::vFlush()
|
||||||
{
|
{
|
||||||
if (LocalVBuffer == s_pCurBufferPointer) return;
|
if (LocalVBuffer == s_pCurBufferPointer) return;
|
||||||
|
@ -274,8 +273,10 @@ void VertexManager::vFlush()
|
||||||
unsigned int stride = g_nativeVertexFmt->GetVertexStride();
|
unsigned int stride = g_nativeVertexFmt->GetVertexStride();
|
||||||
g_nativeVertexFmt->SetupVertexPointers();
|
g_nativeVertexFmt->SetupVertexPointers();
|
||||||
g_renderer->ApplyState(useDstAlpha);
|
g_renderer->ApplyState(useDstAlpha);
|
||||||
|
|
||||||
|
g_perf_query->EnableQuery(bpmem.zcontrol.early_ztest ? PQG_ZCOMP_ZCOMPLOC : PQG_ZCOMP);
|
||||||
Draw(stride);
|
Draw(stride);
|
||||||
|
g_perf_query->DisableQuery(bpmem.zcontrol.early_ztest ? PQG_ZCOMP_ZCOMPLOC : PQG_ZCOMP);
|
||||||
|
|
||||||
GFX_DEBUGGER_PAUSE_AT(NEXT_FLUSH, true);
|
GFX_DEBUGGER_PAUSE_AT(NEXT_FLUSH, true);
|
||||||
|
|
||||||
|
|
|
@ -42,6 +42,7 @@
|
||||||
|
|
||||||
#include "D3DUtil.h"
|
#include "D3DUtil.h"
|
||||||
#include "D3DBase.h"
|
#include "D3DBase.h"
|
||||||
|
#include "PerfQuery.h"
|
||||||
#include "PixelShaderCache.h"
|
#include "PixelShaderCache.h"
|
||||||
#include "TextureCache.h"
|
#include "TextureCache.h"
|
||||||
#include "VertexManager.h"
|
#include "VertexManager.h"
|
||||||
|
@ -183,6 +184,7 @@ void VideoBackend::Video_Prepare()
|
||||||
g_renderer = new Renderer;
|
g_renderer = new Renderer;
|
||||||
g_texture_cache = new TextureCache;
|
g_texture_cache = new TextureCache;
|
||||||
g_vertex_manager = new VertexManager;
|
g_vertex_manager = new VertexManager;
|
||||||
|
g_perf_query = new PerfQuery;
|
||||||
VertexShaderCache::Init();
|
VertexShaderCache::Init();
|
||||||
PixelShaderCache::Init();
|
PixelShaderCache::Init();
|
||||||
D3D::InitUtils();
|
D3D::InitUtils();
|
||||||
|
@ -225,6 +227,7 @@ void VideoBackend::Shutdown()
|
||||||
D3D::ShutdownUtils();
|
D3D::ShutdownUtils();
|
||||||
PixelShaderCache::Shutdown();
|
PixelShaderCache::Shutdown();
|
||||||
VertexShaderCache::Shutdown();
|
VertexShaderCache::Shutdown();
|
||||||
|
delete g_perf_query;
|
||||||
delete g_vertex_manager;
|
delete g_vertex_manager;
|
||||||
delete g_texture_cache;
|
delete g_texture_cache;
|
||||||
delete g_renderer;
|
delete g_renderer;
|
||||||
|
|
|
@ -57,6 +57,7 @@
|
||||||
|
|
||||||
#include "ConfigManager.h"
|
#include "ConfigManager.h"
|
||||||
#include "VideoBackend.h"
|
#include "VideoBackend.h"
|
||||||
|
#include "PerfQueryBase.h"
|
||||||
|
|
||||||
namespace DX9
|
namespace DX9
|
||||||
{
|
{
|
||||||
|
@ -97,8 +98,6 @@ void InitBackendInfo()
|
||||||
g_Config.backend_info.bSupports3DVision = true;
|
g_Config.backend_info.bSupports3DVision = true;
|
||||||
g_Config.backend_info.bSupportsDualSourceBlend = false;
|
g_Config.backend_info.bSupportsDualSourceBlend = false;
|
||||||
g_Config.backend_info.bSupportsFormatReinterpretation = true;
|
g_Config.backend_info.bSupportsFormatReinterpretation = true;
|
||||||
|
|
||||||
|
|
||||||
g_Config.backend_info.bSupportsPixelLighting = C_PLIGHTS + 40 <= maxConstants && C_PMATERIALS + 4 <= maxConstants;
|
g_Config.backend_info.bSupportsPixelLighting = C_PLIGHTS + 40 <= maxConstants && C_PMATERIALS + 4 <= maxConstants;
|
||||||
|
|
||||||
// adapters
|
// adapters
|
||||||
|
@ -172,6 +171,7 @@ void VideoBackend::Video_Prepare()
|
||||||
g_vertex_manager = new VertexManager;
|
g_vertex_manager = new VertexManager;
|
||||||
g_renderer = new Renderer;
|
g_renderer = new Renderer;
|
||||||
g_texture_cache = new TextureCache;
|
g_texture_cache = new TextureCache;
|
||||||
|
g_perf_query = new PerfQueryBase;
|
||||||
// VideoCommon
|
// VideoCommon
|
||||||
BPInit();
|
BPInit();
|
||||||
Fifo_Init();
|
Fifo_Init();
|
||||||
|
@ -209,6 +209,7 @@ void VideoBackend::Shutdown()
|
||||||
// internal interfaces
|
// internal interfaces
|
||||||
PixelShaderCache::Shutdown();
|
PixelShaderCache::Shutdown();
|
||||||
VertexShaderCache::Shutdown();
|
VertexShaderCache::Shutdown();
|
||||||
|
delete g_perf_query;
|
||||||
delete g_texture_cache;
|
delete g_texture_cache;
|
||||||
delete g_renderer;
|
delete g_renderer;
|
||||||
delete g_vertex_manager;
|
delete g_vertex_manager;
|
||||||
|
|
|
@ -2,6 +2,7 @@ set(SRCS Src/FramebufferManager.cpp
|
||||||
Src/GLUtil.cpp
|
Src/GLUtil.cpp
|
||||||
Src/main.cpp
|
Src/main.cpp
|
||||||
Src/NativeVertexFormat.cpp
|
Src/NativeVertexFormat.cpp
|
||||||
|
Src/PerfQuery.cpp
|
||||||
Src/PixelShaderCache.cpp
|
Src/PixelShaderCache.cpp
|
||||||
Src/PostProcessing.cpp
|
Src/PostProcessing.cpp
|
||||||
Src/RasterFont.cpp
|
Src/RasterFont.cpp
|
||||||
|
|
|
@ -200,6 +200,7 @@
|
||||||
<ClCompile Include="Src\GLUtil.cpp" />
|
<ClCompile Include="Src\GLUtil.cpp" />
|
||||||
<ClCompile Include="Src\main.cpp" />
|
<ClCompile Include="Src\main.cpp" />
|
||||||
<ClCompile Include="Src\NativeVertexFormat.cpp" />
|
<ClCompile Include="Src\NativeVertexFormat.cpp" />
|
||||||
|
<ClCompile Include="Src\PerfQuery.cpp" />
|
||||||
<ClCompile Include="Src\PixelShaderCache.cpp" />
|
<ClCompile Include="Src\PixelShaderCache.cpp" />
|
||||||
<ClCompile Include="Src\PostProcessing.cpp" />
|
<ClCompile Include="Src\PostProcessing.cpp" />
|
||||||
<ClCompile Include="Src\RasterFont.cpp" />
|
<ClCompile Include="Src\RasterFont.cpp" />
|
||||||
|
@ -222,6 +223,7 @@
|
||||||
<ClInclude Include="Src\Globals.h" />
|
<ClInclude Include="Src\Globals.h" />
|
||||||
<ClInclude Include="Src\GLUtil.h" />
|
<ClInclude Include="Src\GLUtil.h" />
|
||||||
<ClInclude Include="Src\main.h" />
|
<ClInclude Include="Src\main.h" />
|
||||||
|
<ClInclude Include="Src\PerfQuery.h" />
|
||||||
<ClInclude Include="Src\PixelShaderCache.h" />
|
<ClInclude Include="Src\PixelShaderCache.h" />
|
||||||
<ClInclude Include="Src\PostProcessing.h" />
|
<ClInclude Include="Src\PostProcessing.h" />
|
||||||
<ClInclude Include="Src\RasterFont.h" />
|
<ClInclude Include="Src\RasterFont.h" />
|
||||||
|
|
|
@ -36,6 +36,9 @@
|
||||||
<ClCompile Include="Src\VertexShaderCache.cpp">
|
<ClCompile Include="Src\VertexShaderCache.cpp">
|
||||||
<Filter>Render</Filter>
|
<Filter>Render</Filter>
|
||||||
</ClCompile>
|
</ClCompile>
|
||||||
|
<ClCompile Include="Src\PerfQuery.cpp">
|
||||||
|
<Filter>Render</Filter>
|
||||||
|
</ClCompile>
|
||||||
</ItemGroup>
|
</ItemGroup>
|
||||||
<ItemGroup>
|
<ItemGroup>
|
||||||
<ClInclude Include="Src\Globals.h" />
|
<ClInclude Include="Src\Globals.h" />
|
||||||
|
@ -72,6 +75,9 @@
|
||||||
<ClInclude Include="Src\VertexShaderCache.h">
|
<ClInclude Include="Src\VertexShaderCache.h">
|
||||||
<Filter>Render</Filter>
|
<Filter>Render</Filter>
|
||||||
</ClInclude>
|
</ClInclude>
|
||||||
|
<ClInclude Include="Src\PerfQuery.h">
|
||||||
|
<Filter>Render</Filter>
|
||||||
|
</ClInclude>
|
||||||
</ItemGroup>
|
</ItemGroup>
|
||||||
<ItemGroup>
|
<ItemGroup>
|
||||||
<None Include="CMakeLists.txt" />
|
<None Include="CMakeLists.txt" />
|
||||||
|
|
|
@ -0,0 +1,133 @@
|
||||||
|
#include "RenderBase.h"
|
||||||
|
#include "GLUtil.h"
|
||||||
|
#include "PerfQuery.h"
|
||||||
|
|
||||||
|
namespace OGL
|
||||||
|
{
|
||||||
|
|
||||||
|
// Generates one GL query object per ring-buffer slot and clears the counters.
PerfQuery::PerfQuery()
	: m_query_read_pos()
	, m_query_count()
{
	ActiveQuery* const buffer_end = m_query_buffer + ARRAYSIZE(m_query_buffer);
	for (ActiveQuery* slot = m_query_buffer; slot != buffer_end; ++slot)
	{
		glGenQueries(1, &slot->query_id);
	}

	ResetQuery();
}
|
||||||
|
|
||||||
|
// Deletes the GL query object of every ring-buffer slot.
PerfQuery::~PerfQuery()
{
	ActiveQuery* const buffer_end = m_query_buffer + ARRAYSIZE(m_query_buffer);
	for (ActiveQuery* slot = m_query_buffer; slot != buffer_end; ++slot)
	{
		glDeleteQueries(1, &slot->query_id);
	}
}
|
||||||
|
|
||||||
|
// Starts a GL_SAMPLES_PASSED query in the next free ring-buffer slot.
// Only the PQG_ZCOMP_ZCOMPLOC and PQG_ZCOMP groups start a query; the buffer
// housekeeping at the top runs for every group.
void PerfQuery::EnableQuery(PerfQueryGroup type)
{
	// Is this sane?
	const bool more_than_half_full = m_query_count > ARRAYSIZE(m_query_buffer) / 2;
	if (more_than_half_full)
		WeakFlush();

	// If the opportunistic flush could not free anything, force one slot free.
	const bool buffer_full = (ARRAYSIZE(m_query_buffer) == m_query_count);
	if (buffer_full)
	{
		FlushOne();
		//ERROR_LOG(VIDEO, "flushed query buffer early!");
	}

	if (type != PQG_ZCOMP_ZCOMPLOC && type != PQG_ZCOMP)
		return;

	// start query
	ActiveQuery& slot = m_query_buffer[(m_query_read_pos + m_query_count) % ARRAYSIZE(m_query_buffer)];

	glBeginQuery(GL_SAMPLES_PASSED, slot.query_id);
	slot.query_type = type;

	++m_query_count;
}
|
||||||
|
|
||||||
|
// Ends the active GL_SAMPLES_PASSED query.
// Groups other than PQG_ZCOMP_ZCOMPLOC and PQG_ZCOMP are ignored.
void PerfQuery::DisableQuery(PerfQueryGroup type)
{
	const bool is_zcomp_group = (type == PQG_ZCOMP_ZCOMPLOC || type == PQG_ZCOMP);
	if (!is_zcomp_group)
		return;

	// stop query
	glEndQuery(GL_SAMPLES_PASSED);
}
|
||||||
|
|
||||||
|
bool PerfQuery::IsFlushed() const
|
||||||
|
{
|
||||||
|
return 0 == m_query_count;
|
||||||
|
}
|
||||||
|
|
||||||
|
void PerfQuery::FlushOne()
|
||||||
|
{
|
||||||
|
auto& entry = m_query_buffer[m_query_read_pos];
|
||||||
|
|
||||||
|
GLuint result = 0;
|
||||||
|
glGetQueryObjectuiv(entry.query_id, GL_QUERY_RESULT, &result);
|
||||||
|
|
||||||
|
// NOTE: Reported pixel metrics should be referenced to native resolution
|
||||||
|
m_results[entry.query_type] += (u64)result * EFB_WIDTH / g_renderer->GetTargetWidth() * EFB_HEIGHT / g_renderer->GetTargetHeight();
|
||||||
|
|
||||||
|
m_query_read_pos = (m_query_read_pos + 1) % ARRAYSIZE(m_query_buffer);
|
||||||
|
--m_query_count;
|
||||||
|
}
|
||||||
|
|
||||||
|
// TODO: could selectively flush things, but I don't think that will do much
|
||||||
|
void PerfQuery::FlushResults()
|
||||||
|
{
|
||||||
|
while (!IsFlushed())
|
||||||
|
FlushOne();
|
||||||
|
}
|
||||||
|
|
||||||
|
void PerfQuery::WeakFlush()
|
||||||
|
{
|
||||||
|
while (!IsFlushed())
|
||||||
|
{
|
||||||
|
auto& entry = m_query_buffer[m_query_read_pos];
|
||||||
|
|
||||||
|
GLuint result = GL_FALSE;
|
||||||
|
glGetQueryObjectuiv(entry.query_id, GL_QUERY_RESULT_AVAILABLE, &result);
|
||||||
|
|
||||||
|
if (GL_TRUE == result)
|
||||||
|
{
|
||||||
|
FlushOne();
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
void PerfQuery::ResetQuery()
|
||||||
|
{
|
||||||
|
m_query_count = 0;
|
||||||
|
std::fill_n(m_results, ARRAYSIZE(m_results), 0);
|
||||||
|
}
|
||||||
|
|
||||||
|
// Maps a PE performance counter to the accumulated group total(s) backing it
// and returns that value divided by 4.
// Unknown counter types yield 0.
u32 PerfQuery::GetQueryResult(PerfQueryType type)
{
	const bool wants_zcomploc = (type == PQ_ZCOMP_INPUT_ZCOMPLOC || type == PQ_ZCOMP_OUTPUT_ZCOMPLOC);
	const bool wants_zcomp = (type == PQ_ZCOMP_INPUT || type == PQ_ZCOMP_OUTPUT);

	u32 total = 0;

	if (wants_zcomploc)
		total = m_results[PQG_ZCOMP_ZCOMPLOC];
	else if (wants_zcomp)
		total = m_results[PQG_ZCOMP];
	else if (type == PQ_BLEND_INPUT)
		total = m_results[PQG_ZCOMP] + m_results[PQG_ZCOMP_ZCOMPLOC]; // both z paths feed the blender count
	else if (type == PQ_EFB_COPY_CLOCKS)
		total = m_results[PQG_EFB_COPY_CLOCKS];

	// NOTE(review): presumably converts a per-pixel sample count into quads — confirm.
	return total / 4;
}
|
||||||
|
|
||||||
|
} // namespace
|
|
@ -0,0 +1,46 @@
|
||||||
|
#ifndef _PERFQUERY_H_
|
||||||
|
#define _PERFQUERY_H_
|
||||||
|
|
||||||
|
#include "PerfQueryBase.h"
|
||||||
|
|
||||||
|
namespace OGL {
|
||||||
|
|
||||||
|
class PerfQuery : public PerfQueryBase
|
||||||
|
{
|
||||||
|
public:
|
||||||
|
PerfQuery();
|
||||||
|
~PerfQuery();
|
||||||
|
|
||||||
|
void EnableQuery(PerfQueryGroup type);
|
||||||
|
void DisableQuery(PerfQueryGroup type);
|
||||||
|
void ResetQuery();
|
||||||
|
u32 GetQueryResult(PerfQueryType type);
|
||||||
|
void FlushResults();
|
||||||
|
bool IsFlushed() const;
|
||||||
|
|
||||||
|
private:
|
||||||
|
struct ActiveQuery
|
||||||
|
{
|
||||||
|
GLuint query_id;
|
||||||
|
PerfQueryGroup query_type;
|
||||||
|
};
|
||||||
|
|
||||||
|
// when testing in SMS: 64 was too small, 128 was ok
|
||||||
|
static const int PERF_QUERY_BUFFER_SIZE = 512;
|
||||||
|
|
||||||
|
void WeakFlush();
|
||||||
|
// Only use when non-empty
|
||||||
|
void FlushOne();
|
||||||
|
|
||||||
|
// This contains gl query objects with unretrieved results.
|
||||||
|
ActiveQuery m_query_buffer[PERF_QUERY_BUFFER_SIZE];
|
||||||
|
int m_query_read_pos;
|
||||||
|
|
||||||
|
// TODO: sloppy
|
||||||
|
volatile int m_query_count;
|
||||||
|
volatile u32 m_results[PQG_NUM_MEMBERS];
|
||||||
|
};
|
||||||
|
|
||||||
|
} // namespace
|
||||||
|
|
||||||
|
#endif // _PERFQUERY_H_
|
|
@ -1420,6 +1420,7 @@ void Renderer::SetDepthMode()
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
// if the test is disabled write is disabled too
|
// if the test is disabled write is disabled too
|
||||||
|
// TODO: When PE performance metrics are being emulated via occlusion queries, we should (probably?) enable depth test with depth function ALWAYS here
|
||||||
glDisable(GL_DEPTH_TEST);
|
glDisable(GL_DEPTH_TEST);
|
||||||
glDepthMask(GL_FALSE);
|
glDepthMask(GL_FALSE);
|
||||||
}
|
}
|
||||||
|
|
|
@ -40,6 +40,7 @@
|
||||||
#include "OpcodeDecoding.h"
|
#include "OpcodeDecoding.h"
|
||||||
#include "FileUtil.h"
|
#include "FileUtil.h"
|
||||||
#include "Debugger.h"
|
#include "Debugger.h"
|
||||||
|
#include "PerfQueryBase.h"
|
||||||
|
|
||||||
#include "main.h"
|
#include "main.h"
|
||||||
|
|
||||||
|
@ -217,7 +218,10 @@ void VertexManager::vFlush()
|
||||||
if (ps) PixelShaderCache::SetCurrentShader(ps->glprogid); // Lego Star Wars crashes here.
|
if (ps) PixelShaderCache::SetCurrentShader(ps->glprogid); // Lego Star Wars crashes here.
|
||||||
if (vs) VertexShaderCache::SetCurrentShader(vs->glprogid);
|
if (vs) VertexShaderCache::SetCurrentShader(vs->glprogid);
|
||||||
|
|
||||||
|
g_perf_query->EnableQuery(bpmem.zcontrol.early_ztest ? PQG_ZCOMP_ZCOMPLOC : PQG_ZCOMP);
|
||||||
Draw();
|
Draw();
|
||||||
|
g_perf_query->DisableQuery(bpmem.zcontrol.early_ztest ? PQG_ZCOMP_ZCOMPLOC : PQG_ZCOMP);
|
||||||
|
//ERROR_LOG(VIDEO, "PerfQuery result: %d", g_perf_query->GetQueryResult(bpmem.zcontrol.early_ztest ? PQ_ZCOMP_OUTPUT_ZCOMPLOC : PQ_ZCOMP_OUTPUT));
|
||||||
|
|
||||||
// run through vertex groups again to set alpha
|
// run through vertex groups again to set alpha
|
||||||
if (useDstAlpha && !dualSourcePossible)
|
if (useDstAlpha && !dualSourcePossible)
|
||||||
|
|
|
@ -92,6 +92,7 @@ Make AA apply instantly during gameplay if possible
|
||||||
#include "FramebufferManager.h"
|
#include "FramebufferManager.h"
|
||||||
#include "Core.h"
|
#include "Core.h"
|
||||||
#include "Host.h"
|
#include "Host.h"
|
||||||
|
#include "PerfQuery.h"
|
||||||
|
|
||||||
#include "VideoState.h"
|
#include "VideoState.h"
|
||||||
#include "VideoBackend.h"
|
#include "VideoBackend.h"
|
||||||
|
@ -194,6 +195,7 @@ void VideoBackend::Video_Prepare()
|
||||||
|
|
||||||
BPInit();
|
BPInit();
|
||||||
g_vertex_manager = new VertexManager;
|
g_vertex_manager = new VertexManager;
|
||||||
|
g_perf_query = new PerfQuery;
|
||||||
Fifo_Init(); // must be done before OpcodeDecoder_Init()
|
Fifo_Init(); // must be done before OpcodeDecoder_Init()
|
||||||
OpcodeDecoder_Init();
|
OpcodeDecoder_Init();
|
||||||
VertexShaderCache::Init();
|
VertexShaderCache::Init();
|
||||||
|
|
|
@ -90,6 +90,21 @@ void SWBPWritten(int address, int newvalue)
|
||||||
SWPixelEngine::pereg.boxBottom = newvalue >> 10;
|
SWPixelEngine::pereg.boxBottom = newvalue >> 10;
|
||||||
SWPixelEngine::pereg.boxTop = newvalue & 0x3ff;
|
SWPixelEngine::pereg.boxTop = newvalue & 0x3ff;
|
||||||
break;
|
break;
|
||||||
|
case BPMEM_CLEAR_PIXEL_PERF:
|
||||||
|
// TODO: I didn't test if the value written to this register affects the amount of cleared registers
|
||||||
|
SWPixelEngine::pereg.perfZcompInputZcomplocLo = 0;
|
||||||
|
SWPixelEngine::pereg.perfZcompInputZcomplocHi = 0;
|
||||||
|
SWPixelEngine::pereg.perfZcompOutputZcomplocLo = 0;
|
||||||
|
SWPixelEngine::pereg.perfZcompOutputZcomplocHi = 0;
|
||||||
|
SWPixelEngine::pereg.perfZcompInputLo = 0;
|
||||||
|
SWPixelEngine::pereg.perfZcompInputHi = 0;
|
||||||
|
SWPixelEngine::pereg.perfZcompOutputLo = 0;
|
||||||
|
SWPixelEngine::pereg.perfZcompOutputHi = 0;
|
||||||
|
SWPixelEngine::pereg.perfBlendInputLo = 0;
|
||||||
|
SWPixelEngine::pereg.perfBlendInputHi = 0;
|
||||||
|
SWPixelEngine::pereg.perfEfbCopyClocksLo = 0;
|
||||||
|
SWPixelEngine::pereg.perfEfbCopyClocksHi = 0;
|
||||||
|
break;
|
||||||
case BPMEM_LOADTLUT0: // This one updates bpmem.tlutXferSrc, no need to do anything here.
|
case BPMEM_LOADTLUT0: // This one updates bpmem.tlutXferSrc, no need to do anything here.
|
||||||
break;
|
break;
|
||||||
case BPMEM_LOADTLUT1: // Load a Texture Look Up Table
|
case BPMEM_LOADTLUT1: // Load a Texture Look Up Table
|
||||||
|
|
|
@ -65,6 +65,13 @@ namespace Clipper
|
||||||
OutputVertexData ClippedVertices[NUM_CLIPPED_VERTICES];
|
OutputVertexData ClippedVertices[NUM_CLIPPED_VERTICES];
|
||||||
OutputVertexData *Vertices[NUM_INDICES];
|
OutputVertexData *Vertices[NUM_INDICES];
|
||||||
|
|
||||||
|
// Savestate hook for the clipper: serializes the two view-offset values and
// then each entry of ClippedVertices, in order.
void DoState(PointerWrap &p)
{
	p.DoArray(m_ViewOffset, 2);

	for (OutputVertexData& clipped : ClippedVertices)
		clipped.DoState(p);
}
|
||||||
|
|
||||||
void Init()
|
void Init()
|
||||||
{
|
{
|
||||||
for (int i = 0; i < NUM_CLIPPED_VERTICES; ++i)
|
for (int i = 0; i < NUM_CLIPPED_VERTICES; ++i)
|
||||||
|
|
|
@ -21,6 +21,7 @@
|
||||||
|
|
||||||
#include "Common.h"
|
#include "Common.h"
|
||||||
#include "NativeVertexFormat.h"
|
#include "NativeVertexFormat.h"
|
||||||
|
#include "ChunkFile.h"
|
||||||
|
|
||||||
|
|
||||||
namespace Clipper
|
namespace Clipper
|
||||||
|
@ -36,6 +37,8 @@ namespace Clipper
|
||||||
bool CullTest(OutputVertexData *v0, OutputVertexData *v1, OutputVertexData *v2, bool &backface);
|
bool CullTest(OutputVertexData *v0, OutputVertexData *v1, OutputVertexData *v2, bool &backface);
|
||||||
|
|
||||||
void PerspectiveDivide(OutputVertexData *vertex);
|
void PerspectiveDivide(OutputVertexData *vertex);
|
||||||
|
|
||||||
|
void DoState(PointerWrap &p);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
|
@ -28,6 +28,7 @@ u8 efb[EFB_WIDTH*EFB_HEIGHT*6];
|
||||||
|
|
||||||
namespace EfbInterface
|
namespace EfbInterface
|
||||||
{
|
{
|
||||||
|
|
||||||
u8 efbColorTexture[EFB_WIDTH*EFB_HEIGHT*4];
|
u8 efbColorTexture[EFB_WIDTH*EFB_HEIGHT*4];
|
||||||
|
|
||||||
inline u32 GetColorOffset(u16 x, u16 y)
|
inline u32 GetColorOffset(u16 x, u16 y)
|
||||||
|
@ -40,6 +41,12 @@ namespace EfbInterface
|
||||||
return (x + y * EFB_WIDTH) * 3 + DEPTH_BUFFER_START;
|
return (x + y * EFB_WIDTH) * 3 + DEPTH_BUFFER_START;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Savestate hook for the EFB: serializes the raw EFB storage followed by the
// RGBA color texture derived from it.
void DoState(PointerWrap &p)
{
	const auto efb_size = EFB_WIDTH*EFB_HEIGHT*6;
	const auto color_texture_size = EFB_WIDTH*EFB_HEIGHT*4;

	p.DoArray(efb, efb_size);
	p.DoArray(efbColorTexture, color_texture_size);
}
|
||||||
|
|
||||||
void SetPixelAlphaOnly(u32 offset, u8 a)
|
void SetPixelAlphaOnly(u32 offset, u8 a)
|
||||||
{
|
{
|
||||||
switch (bpmem.zcontrol.pixel_format)
|
switch (bpmem.zcontrol.pixel_format)
|
||||||
|
|
|
@ -47,6 +47,7 @@ namespace EfbInterface
|
||||||
|
|
||||||
void UpdateColorTexture();
|
void UpdateColorTexture();
|
||||||
extern u8 efbColorTexture[EFB_WIDTH*EFB_HEIGHT*4]; // RGBA format
|
extern u8 efbColorTexture[EFB_WIDTH*EFB_HEIGHT*4]; // RGBA format
|
||||||
|
void DoState(PointerWrap &p);
|
||||||
}
|
}
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -19,6 +19,7 @@
|
||||||
#define _NATIVEVERTEXFORMAT_H
|
#define _NATIVEVERTEXFORMAT_H
|
||||||
|
|
||||||
#include "Vec3.h"
|
#include "Vec3.h"
|
||||||
|
#include "ChunkFile.h"
|
||||||
|
|
||||||
#ifdef WIN32
|
#ifdef WIN32
|
||||||
#define LOADERDECL __cdecl
|
#define LOADERDECL __cdecl
|
||||||
|
@ -92,6 +93,18 @@ struct OutputVertexData
|
||||||
#undef LINTERP
|
#undef LINTERP
|
||||||
#undef LINTERP_INT
|
#undef LINTERP_INT
|
||||||
}
|
}
|
||||||
|
// Serializes every field of the vertex, in declaration-like order:
// positions, the three normals, the colors, then the eight texture coords.
void DoState(PointerWrap &p)
{
	mvPosition.DoState(p);
	p.Do(projectedPosition);
	screenPosition.DoState(p);

	for (int n = 0; n != 3; ++n)
	{
		normal[n].DoState(p);
	}

	// NOTE(review): sizeof is passed where other callers pass an element
	// count — confirm which unit DoArray expects for this array.
	p.DoArray(color, sizeof color);

	for (int t = 0; t != 8; ++t)
	{
		texCoords[t].DoState(p);
	}
}
|
||||||
|
|
||||||
};
|
};
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -35,7 +35,6 @@ typedef void (*DecodingFunction)(u32);
|
||||||
|
|
||||||
namespace OpcodeDecoder
|
namespace OpcodeDecoder
|
||||||
{
|
{
|
||||||
|
|
||||||
static DecodingFunction currentFunction = NULL;
|
static DecodingFunction currentFunction = NULL;
|
||||||
static u32 minCommandSize;
|
static u32 minCommandSize;
|
||||||
static u16 streamSize;
|
static u16 streamSize;
|
||||||
|
@ -46,6 +45,20 @@ static bool inObjectStream;
|
||||||
static u8 lastPrimCmd;
|
static u8 lastPrimCmd;
|
||||||
|
|
||||||
|
|
||||||
|
// Savestate hook for the opcode decoder. Serializes the stream-tracking
// variables and, when a state is being loaded, resets the decoder afterwards.
void DoState(PointerWrap &p)
{
	p.Do(minCommandSize);

	// Not sure what is wrong with this. Something(s) in here is causing dolphin
	// to crash/hang when loading states saved from another run of dolphin.
	// Doesn't seem too important anyway...
	//vertexLoader.DoState(p);

	p.Do(readOpcode);
	p.Do(inObjectStream);
	p.Do(lastPrimCmd);
	p.Do(streamSize);
	p.Do(streamAddress);

	const bool loading = (p.GetMode() == PointerWrap::MODE_READ);
	if (loading)
	{
		ResetDecoding();
	}
}
|
||||||
|
|
||||||
void DecodePrimitiveStream(u32 iBufferSize)
|
void DecodePrimitiveStream(u32 iBufferSize)
|
||||||
{
|
{
|
||||||
u32 vertexSize = vertexLoader.GetVertexSize();
|
u32 vertexSize = vertexLoader.GetVertexSize();
|
||||||
|
|
|
@ -20,6 +20,7 @@
|
||||||
#define _OPCODEDECODER_H_
|
#define _OPCODEDECODER_H_
|
||||||
|
|
||||||
#include "CommonTypes.h"
|
#include "CommonTypes.h"
|
||||||
|
#include "ChunkFile.h"
|
||||||
|
|
||||||
namespace OpcodeDecoder
|
namespace OpcodeDecoder
|
||||||
{
|
{
|
||||||
|
@ -57,6 +58,8 @@ namespace OpcodeDecoder
|
||||||
bool CommandRunnable(u32 iBufferSize);
|
bool CommandRunnable(u32 iBufferSize);
|
||||||
|
|
||||||
void Run(u32 iBufferSize);
|
void Run(u32 iBufferSize);
|
||||||
|
|
||||||
|
void DoState(PointerWrap &p);
|
||||||
}
|
}
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -23,6 +23,7 @@
|
||||||
#include "BPMemLoader.h"
|
#include "BPMemLoader.h"
|
||||||
#include "XFMemLoader.h"
|
#include "XFMemLoader.h"
|
||||||
#include "Tev.h"
|
#include "Tev.h"
|
||||||
|
#include "SWPixelEngine.h"
|
||||||
#include "SWStatistics.h"
|
#include "SWStatistics.h"
|
||||||
#include "SWVideoConfig.h"
|
#include "SWVideoConfig.h"
|
||||||
|
|
||||||
|
@ -62,6 +63,28 @@ s32 scissorBottom = 0;
|
||||||
Tev tev;
|
Tev tev;
|
||||||
RasterBlock rasterBlock;
|
RasterBlock rasterBlock;
|
||||||
|
|
||||||
|
// Savestate hook for the rasterizer: slopes first, then the vertex/scissor
// scalars, then the TEV unit and the current raster block.
void DoState(PointerWrap &p)
{
	ZSlope.DoState(p);
	WSlope.DoState(p);

	// ColorSlopes is walked as [2][4].
	for (int channel = 0; channel < 2; ++channel)
	{
		for (int comp = 0; comp < 4; ++comp)
		{
			ColorSlopes[channel][comp].DoState(p);
		}
	}

	// TexSlopes is walked as [8][3].
	for (int unit = 0; unit < 8; ++unit)
	{
		for (int comp = 0; comp < 3; ++comp)
		{
			TexSlopes[unit][comp].DoState(p);
		}
	}

	p.Do(vertex0X);
	p.Do(vertex0Y);
	p.Do(vertexOffsetX);
	p.Do(vertexOffsetY);

	p.Do(scissorLeft);
	p.Do(scissorTop);
	p.Do(scissorRight);
	p.Do(scissorBottom);

	tev.DoState(p);
	p.Do(rasterBlock);
}
|
||||||
|
|
||||||
void Init()
|
void Init()
|
||||||
{
|
{
|
||||||
tev.Init();
|
tev.Init();
|
||||||
|
@ -127,9 +150,15 @@ inline void Draw(s32 x, s32 y, s32 xi, s32 yi)
|
||||||
|
|
||||||
if (bpmem.zcontrol.early_ztest && bpmem.zmode.testenable && g_SWVideoConfig.bZComploc)
|
if (bpmem.zcontrol.early_ztest && bpmem.zmode.testenable && g_SWVideoConfig.bZComploc)
|
||||||
{
|
{
|
||||||
// early z
|
// TODO: Test if perf regs are incremented even if test is disabled
|
||||||
if (!EfbInterface::ZCompare(x, y, z))
|
SWPixelEngine::pereg.IncZInputQuadCount(true);
|
||||||
return;
|
if (bpmem.zmode.testenable)
|
||||||
|
{
|
||||||
|
// early z
|
||||||
|
if (!EfbInterface::ZCompare(x, y, z))
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
SWPixelEngine::pereg.IncZOutputQuadCount(true);
|
||||||
}
|
}
|
||||||
|
|
||||||
RasterBlockPixel& pixel = rasterBlock.Pixel[xi][yi];
|
RasterBlockPixel& pixel = rasterBlock.Pixel[xi][yi];
|
||||||
|
|
|
@ -19,6 +19,7 @@
|
||||||
#define _RASTERIZER_H_
|
#define _RASTERIZER_H_
|
||||||
|
|
||||||
#include "NativeVertexFormat.h"
|
#include "NativeVertexFormat.h"
|
||||||
|
#include "ChunkFile.h"
|
||||||
|
|
||||||
namespace Rasterizer
|
namespace Rasterizer
|
||||||
{
|
{
|
||||||
|
@ -37,6 +38,12 @@ namespace Rasterizer
|
||||||
float f0;
|
float f0;
|
||||||
|
|
||||||
float GetValue(float dx, float dy) { return f0 + (dfdx * dx) + (dfdy * dy); }
|
float GetValue(float dx, float dy) { return f0 + (dfdx * dx) + (dfdy * dy); }
|
||||||
|
// Serializes the three plane coefficients that GetValue() combines:
// the x and y derivatives followed by the base value.
void DoState(PointerWrap &p)
{
	p.Do(dfdx);
	p.Do(dfdy);
	p.Do(f0);
}
|
||||||
};
|
};
|
||||||
|
|
||||||
struct RasterBlockPixel
|
struct RasterBlockPixel
|
||||||
|
@ -53,6 +60,8 @@ namespace Rasterizer
|
||||||
s32 TextureLod[16];
|
s32 TextureLod[16];
|
||||||
bool TextureLinear[16];
|
bool TextureLinear[16];
|
||||||
};
|
};
|
||||||
|
|
||||||
|
void DoState(PointerWrap &p);
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -57,6 +57,15 @@ CPReg cpreg; // shared between gfx and emulator thread
|
||||||
void DoState(PointerWrap &p)
|
void DoState(PointerWrap &p)
|
||||||
{
|
{
|
||||||
p.Do(cpreg);
|
p.Do(cpreg);
|
||||||
|
p.DoArray(commandBuffer, commandBufferSize);
|
||||||
|
p.Do(readPos);
|
||||||
|
p.Do(writePos);
|
||||||
|
p.Do(et_UpdateInterrupts);
|
||||||
|
p.Do(interruptSet);
|
||||||
|
p.Do(interruptWaiting);
|
||||||
|
|
||||||
|
// Is this right?
|
||||||
|
p.DoArray(g_pVideoData,writePos);
|
||||||
}
|
}
|
||||||
|
|
||||||
// does it matter that there is no synchronization between threads during writes?
|
// does it matter that there is no synchronization between threads during writes?
|
||||||
|
|
|
@ -53,6 +53,8 @@ void DoState(PointerWrap &p)
|
||||||
p.Do(pereg);
|
p.Do(pereg);
|
||||||
p.Do(g_bSignalTokenInterrupt);
|
p.Do(g_bSignalTokenInterrupt);
|
||||||
p.Do(g_bSignalFinishInterrupt);
|
p.Do(g_bSignalFinishInterrupt);
|
||||||
|
p.Do(et_SetTokenOnMainThread);
|
||||||
|
p.Do(et_SetFinishOnMainThread);
|
||||||
}
|
}
|
||||||
|
|
||||||
void UpdateInterrupts();
|
void UpdateInterrupts();
|
||||||
|
@ -77,7 +79,7 @@ void Read16(u16& _uReturnValue, const u32 _iAddress)
|
||||||
|
|
||||||
u16 address = _iAddress & 0xFFF;
|
u16 address = _iAddress & 0xFFF;
|
||||||
|
|
||||||
if (address <= 0x16)
|
if (address <= 0x2e)
|
||||||
_uReturnValue = ((u16*)&pereg)[address >> 1];
|
_uReturnValue = ((u16*)&pereg)[address >> 1];
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -109,7 +111,7 @@ void Write16(const u16 _iValue, const u32 _iAddress)
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
default:
|
default:
|
||||||
if (address <= 0x16)
|
if (address <= 0x2e)
|
||||||
((u16*)&pereg)[address >> 1] = _iValue;
|
((u16*)&pereg)[address >> 1] = _iValue;
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
|
@ -38,6 +38,21 @@ namespace SWPixelEngine
|
||||||
PE_BBOX_RIGHT = 0x012, // Flip Right
|
PE_BBOX_RIGHT = 0x012, // Flip Right
|
||||||
PE_BBOX_TOP = 0x014, // Flip Top
|
PE_BBOX_TOP = 0x014, // Flip Top
|
||||||
PE_BBOX_BOTTOM = 0x016, // Flip Bottom
|
PE_BBOX_BOTTOM = 0x016, // Flip Bottom
|
||||||
|
|
||||||
|
// NOTE: Order not verified
|
||||||
|
// These indicate the number of quads that are being used as input/output for each particular stage
|
||||||
|
PE_PERF_ZCOMP_INPUT_ZCOMPLOC_L = 0x18,
|
||||||
|
PE_PERF_ZCOMP_INPUT_ZCOMPLOC_H = 0x1a,
|
||||||
|
PE_PERF_ZCOMP_OUTPUT_ZCOMPLOC_L = 0x1c,
|
||||||
|
PE_PERF_ZCOMP_OUTPUT_ZCOMPLOC_H = 0x1e,
|
||||||
|
PE_PERF_ZCOMP_INPUT_L = 0x20,
|
||||||
|
PE_PERF_ZCOMP_INPUT_H = 0x22,
|
||||||
|
PE_PERF_ZCOMP_OUTPUT_L = 0x24,
|
||||||
|
PE_PERF_ZCOMP_OUTPUT_H = 0x26,
|
||||||
|
PE_PERF_BLEND_INPUT_L = 0x28,
|
||||||
|
PE_PERF_BLEND_INPUT_H = 0x2a,
|
||||||
|
PE_PERF_EFB_COPY_CLOCKS_L = 0x2c,
|
||||||
|
PE_PERF_EFB_COPY_CLOCKS_H = 0x2e,
|
||||||
};
|
};
|
||||||
|
|
||||||
union UPEZConfReg
|
union UPEZConfReg
|
||||||
|
@ -125,10 +140,72 @@ namespace SWPixelEngine
|
||||||
UPECtrlReg ctrl;
|
UPECtrlReg ctrl;
|
||||||
u16 unk0;
|
u16 unk0;
|
||||||
u16 token;
|
u16 token;
|
||||||
|
|
||||||
u16 boxLeft;
|
u16 boxLeft;
|
||||||
u16 boxRight;
|
u16 boxRight;
|
||||||
u16 boxTop;
|
u16 boxTop;
|
||||||
u16 boxBottom;
|
u16 boxBottom;
|
||||||
|
|
||||||
|
u16 perfZcompInputZcomplocLo;
|
||||||
|
u16 perfZcompInputZcomplocHi;
|
||||||
|
u16 perfZcompOutputZcomplocLo;
|
||||||
|
u16 perfZcompOutputZcomplocHi;
|
||||||
|
u16 perfZcompInputLo;
|
||||||
|
u16 perfZcompInputHi;
|
||||||
|
u16 perfZcompOutputLo;
|
||||||
|
u16 perfZcompOutputHi;
|
||||||
|
u16 perfBlendInputLo;
|
||||||
|
u16 perfBlendInputHi;
|
||||||
|
u16 perfEfbCopyClocksLo;
|
||||||
|
u16 perfEfbCopyClocksHi;
|
||||||
|
|
||||||
|
// NOTE: hardware doesn't process individual pixels but quads instead. Current software renderer architecture works on pixels though, so we have this "quad" hack here to only increment the registers on every fourth rendered pixel
|
||||||
|
void IncZInputQuadCount(bool early_ztest)
|
||||||
|
{
|
||||||
|
static int quad = 0;
|
||||||
|
if (++quad != 3)
|
||||||
|
return;
|
||||||
|
quad = 0;
|
||||||
|
|
||||||
|
if (early_ztest)
|
||||||
|
{
|
||||||
|
if (++perfZcompInputZcomplocLo == 0)
|
||||||
|
perfZcompInputZcomplocHi++;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
if (++perfZcompInputLo == 0)
|
||||||
|
perfZcompInputHi++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
void IncZOutputQuadCount(bool early_ztest)
|
||||||
|
{
|
||||||
|
static int quad = 0;
|
||||||
|
if (++quad != 3)
|
||||||
|
return;
|
||||||
|
quad = 0;
|
||||||
|
|
||||||
|
if (early_ztest)
|
||||||
|
{
|
||||||
|
if (++perfZcompOutputZcomplocLo == 0)
|
||||||
|
perfZcompOutputZcomplocHi++;
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
if (++perfZcompOutputLo == 0)
|
||||||
|
perfZcompOutputHi++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
void IncBlendInputQuadCount()
|
||||||
|
{
|
||||||
|
static int quad = 0;
|
||||||
|
if (++quad != 3)
|
||||||
|
return;
|
||||||
|
quad = 0;
|
||||||
|
|
||||||
|
if (++perfBlendInputLo == 0)
|
||||||
|
perfBlendInputHi++;
|
||||||
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
extern PEReg pereg;
|
extern PEReg pereg;
|
||||||
|
|
|
@ -328,4 +328,15 @@ void SWVertexLoader::LoadTexCoord(SWVertexLoader *vertexLoader, InputVertexData
|
||||||
vertexLoader->m_texCoordLoader[index]();
|
vertexLoader->m_texCoordLoader[index]();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Serializes the loader's configuration: attribute loader table, vertex size,
// the current VAT, the per-attribute loader entries, the setup unit and the
// texgen special-case flag.
void SWVertexLoader::DoState(PointerWrap &p)
{
	p.DoArray(m_AttributeLoaders, sizeof m_AttributeLoaders);
	p.Do(m_VertexSize);

	// NOTE(review): dereferences m_CurrentVat without a null check — confirm
	// it is always set before a savestate can be taken.
	p.Do(*m_CurrentVat);

	p.Do(m_positionLoader);
	p.Do(m_normalLoader);
	p.DoArray(m_colorLoader, sizeof m_colorLoader);
	p.Do(m_NumAttributeLoaders);

	// NOTE(review): likewise assumes m_SetupUnit is non-null — confirm.
	m_SetupUnit->DoState(p);

	p.Do(m_TexGenSpecialCase);
}
|
|
@ -22,6 +22,7 @@
|
||||||
|
|
||||||
#include "NativeVertexFormat.h"
|
#include "NativeVertexFormat.h"
|
||||||
#include "CPMemLoader.h"
|
#include "CPMemLoader.h"
|
||||||
|
#include "ChunkFile.h"
|
||||||
|
|
||||||
class SetupUnit;
|
class SetupUnit;
|
||||||
|
|
||||||
|
@ -69,7 +70,7 @@ public:
|
||||||
u32 GetVertexSize() { return m_VertexSize; }
|
u32 GetVertexSize() { return m_VertexSize; }
|
||||||
|
|
||||||
void LoadVertex();
|
void LoadVertex();
|
||||||
|
void DoState(PointerWrap &p);
|
||||||
};
|
};
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -39,6 +39,9 @@
|
||||||
#include "FileUtil.h"
|
#include "FileUtil.h"
|
||||||
#include "VideoBackend.h"
|
#include "VideoBackend.h"
|
||||||
#include "Core.h"
|
#include "Core.h"
|
||||||
|
#include "OpcodeDecoder.h"
|
||||||
|
#include "SWVertexLoader.h"
|
||||||
|
#include "SWStatistics.h"
|
||||||
|
|
||||||
#define VSYNC_ENABLED 0
|
#define VSYNC_ENABLED 0
|
||||||
|
|
||||||
|
@ -93,9 +96,33 @@ bool VideoSoftware::Initialize(void *&window_handle)
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
|
|
||||||
void VideoSoftware::DoState(PointerWrap&)
|
void VideoSoftware::DoState(PointerWrap& p)
|
||||||
{
|
{
|
||||||
// NYI
|
bool software = true;
|
||||||
|
p.Do(software);
|
||||||
|
if (p.GetMode() == PointerWrap::MODE_READ && software == false)
|
||||||
|
// change mode to abort load of incompatible save state.
|
||||||
|
p.SetMode(PointerWrap::MODE_VERIFY);
|
||||||
|
|
||||||
|
// TODO: incomplete?
|
||||||
|
SWCommandProcessor::DoState(p);
|
||||||
|
SWPixelEngine::DoState(p);
|
||||||
|
EfbInterface::DoState(p);
|
||||||
|
OpcodeDecoder::DoState(p);
|
||||||
|
Clipper::DoState(p);
|
||||||
|
p.Do(swxfregs);
|
||||||
|
p.Do(bpmem);
|
||||||
|
p.Do(swstats);
|
||||||
|
|
||||||
|
// CP Memory
|
||||||
|
p.DoArray(arraybases, 16);
|
||||||
|
p.DoArray(arraystrides, 16);
|
||||||
|
p.Do(MatrixIndexA);
|
||||||
|
p.Do(MatrixIndexB);
|
||||||
|
p.Do(g_VtxDesc.Hex);
|
||||||
|
p.DoArray(g_VtxAttr, 8);
|
||||||
|
p.DoMarker("CP Memory");
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void VideoSoftware::CheckInvalidState()
|
void VideoSoftware::CheckInvalidState()
|
||||||
|
@ -198,6 +225,12 @@ u32 VideoSoftware::Video_AccessEFB(EFBAccessType type, u32 x, u32 y, u32 InputDa
|
||||||
return value;
|
return value;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Performance query results are not implemented for the software backend
// yet; every query type reports 0.
u32 VideoSoftware::Video_GetQueryResult(PerfQueryType type)
{
	// TODO:
	const u32 not_implemented = 0;
	return not_implemented;
}
|
||||||
|
|
||||||
bool VideoSoftware::Video_Screenshot(const char *_szFilename)
|
bool VideoSoftware::Video_Screenshot(const char *_szFilename)
|
||||||
{
|
{
|
||||||
return false;
|
return false;
|
||||||
|
|
|
@ -25,13 +25,13 @@
|
||||||
|
|
||||||
void SetupUnit::Init(u8 primitiveType)
|
void SetupUnit::Init(u8 primitiveType)
|
||||||
{
|
{
|
||||||
m_PrimType = primitiveType;
|
m_PrimType = primitiveType;
|
||||||
|
|
||||||
m_VertexCounter = 0;
|
m_VertexCounter = 0;
|
||||||
m_VertPointer[0] = &m_Vertices[0];
|
m_VertPointer[0] = &m_Vertices[0];
|
||||||
m_VertPointer[1] = &m_Vertices[1];
|
m_VertPointer[1] = &m_Vertices[1];
|
||||||
m_VertPointer[2] = &m_Vertices[2];
|
m_VertPointer[2] = &m_Vertices[2];
|
||||||
m_VertWritePointer = m_VertPointer[0];
|
m_VertWritePointer = m_VertPointer[0];
|
||||||
}
|
}
|
||||||
|
|
||||||
void SetupUnit::SetupVertex()
|
void SetupUnit::SetupVertex()
|
||||||
|
@ -169,3 +169,21 @@ void SetupUnit::SetupLineStrip()
|
||||||
|
|
||||||
void SetupUnit::SetupPoint()
|
void SetupUnit::SetupPoint()
|
||||||
{}
|
{}
|
||||||
|
|
||||||
|
// Savestate hook for the setup unit. Currently a no-op: the serialization
// code below is disabled.
void SetupUnit::DoState(PointerWrap &p)
{
	// TODO: some or all of this is making the save states stop working once
	// dolphin is closed...sometimes (usually).
	// I have no idea what specifically is wrong, or if this is even important.
	// Disabling it doesn't seem to make any noticeable difference...
	/*
	p.Do(m_PrimType);
	p.Do(m_VertexCounter);
	for (int i = 0; i < 3; ++i)
		m_Vertices[i].DoState(p);

	if (p.GetMode() == PointerWrap::MODE_READ)
	{
		m_VertPointer[0] = &m_Vertices[0];
		m_VertPointer[1] = &m_Vertices[1];
		m_VertPointer[2] = &m_Vertices[2];
		m_VertWritePointer = m_VertPointer[0];
	}
	*/
}
|
||||||
|
|
|
@ -21,6 +21,7 @@
|
||||||
|
|
||||||
#include "Common.h"
|
#include "Common.h"
|
||||||
#include "NativeVertexFormat.h"
|
#include "NativeVertexFormat.h"
|
||||||
|
#include "ChunkFile.h"
|
||||||
|
|
||||||
class SetupUnit
|
class SetupUnit
|
||||||
{
|
{
|
||||||
|
@ -45,6 +46,7 @@ public:
|
||||||
OutputVertexData* GetVertex() { return m_VertWritePointer; }
|
OutputVertexData* GetVertex() { return m_VertWritePointer; }
|
||||||
|
|
||||||
void SetupVertex();
|
void SetupVertex();
|
||||||
|
void DoState(PointerWrap &p);
|
||||||
};
|
};
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -20,6 +20,7 @@
|
||||||
#include "Tev.h"
|
#include "Tev.h"
|
||||||
#include "EfbInterface.h"
|
#include "EfbInterface.h"
|
||||||
#include "TextureSampler.h"
|
#include "TextureSampler.h"
|
||||||
|
#include "SWPixelEngine.h"
|
||||||
#include "SWStatistics.h"
|
#include "SWStatistics.h"
|
||||||
#include "SWVideoConfig.h"
|
#include "SWVideoConfig.h"
|
||||||
#include "DebugUtil.h"
|
#include "DebugUtil.h"
|
||||||
|
@ -787,8 +788,13 @@ void Tev::Draw()
|
||||||
bool late_ztest = !bpmem.zcontrol.early_ztest || !g_SWVideoConfig.bZComploc;
|
bool late_ztest = !bpmem.zcontrol.early_ztest || !g_SWVideoConfig.bZComploc;
|
||||||
if (late_ztest && bpmem.zmode.testenable)
|
if (late_ztest && bpmem.zmode.testenable)
|
||||||
{
|
{
|
||||||
if (!EfbInterface::ZCompare(Position[0], Position[1], Position[2]))
|
// TODO: Check against hw if these values get incremented even if depth testing is disabled
|
||||||
return;
|
SWPixelEngine::pereg.IncZInputQuadCount(false);
|
||||||
|
|
||||||
|
if (!EfbInterface::ZCompare(Position[0], Position[1], Position[2]))
|
||||||
|
return;
|
||||||
|
|
||||||
|
SWPixelEngine::pereg.IncZOutputQuadCount(false);
|
||||||
}
|
}
|
||||||
|
|
||||||
#if ALLOW_TEV_DUMPS
|
#if ALLOW_TEV_DUMPS
|
||||||
|
@ -812,6 +818,7 @@ void Tev::Draw()
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
INCSTAT(swstats.thisFrame.tevPixelsOut);
|
INCSTAT(swstats.thisFrame.tevPixelsOut);
|
||||||
|
SWPixelEngine::pereg.IncBlendInputQuadCount();
|
||||||
|
|
||||||
EfbInterface::BlendTev(Position[0], Position[1], output);
|
EfbInterface::BlendTev(Position[0], Position[1], output);
|
||||||
}
|
}
|
||||||
|
@ -827,3 +834,31 @@ void Tev::SetRegColor(int reg, int comp, bool konst, s16 color)
|
||||||
Reg[reg][comp] = color;
|
Reg[reg][comp] = color;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Serializes the TEV unit's registers, constants, lookup tables and the
// per-pixel inputs, in a fixed order.
// NOTE(review): some DoArray calls below pass sizeof(array) while others pass
// an element count — confirm which unit DoArray expects.
void Tev::DoState(PointerWrap &p)
{
	// Registers and constant colors.
	p.DoArray(Reg, sizeof(Reg));
	p.DoArray(KonstantColors, sizeof(KonstantColors));

	// Per-stage color inputs.
	p.DoArray(TexColor, 4);
	p.DoArray(RasColor, 4);
	p.DoArray(StageKonst, 4);
	p.DoArray(Zero16, 4);

	// Constants, indirect texturing state and the current tex coord.
	p.DoArray(FixedConstants, 9);
	p.Do(AlphaBump);
	p.DoArray(IndirectTex, sizeof(IndirectTex));
	p.Do(TexCoord);

	// Bias / scale lookup tables.
	p.DoArray(m_BiasLUT, 4);
	p.DoArray(m_ScaleLShiftLUT, 4);
	p.DoArray(m_ScaleRShiftLUT, 4);

	// Inputs for the pixel being drawn.
	p.DoArray(Position, 3);
	p.DoArray(Color, sizeof(Color));
	p.DoArray(Uv, 8);
	p.DoArray(IndirectLod, 4);
	p.DoArray(IndirectLinear, 4);
	p.DoArray(TextureLod, 16);
	p.DoArray(TextureLinear, 16);
}
|
||||||
|
|
|
@ -19,6 +19,7 @@
|
||||||
#define _TEV_H_
|
#define _TEV_H_
|
||||||
|
|
||||||
#include "BPMemLoader.h"
|
#include "BPMemLoader.h"
|
||||||
|
#include "ChunkFile.h"
|
||||||
|
|
||||||
class Tev
|
class Tev
|
||||||
{
|
{
|
||||||
|
@ -96,6 +97,8 @@ public:
|
||||||
void SetRegColor(int reg, int comp, bool konst, s16 color);
|
void SetRegColor(int reg, int comp, bool konst, s16 color);
|
||||||
|
|
||||||
enum { ALP_C, BLU_C, GRN_C, RED_C };
|
enum { ALP_C, BLU_C, GRN_C, RED_C };
|
||||||
|
|
||||||
|
void DoState(PointerWrap &p);
|
||||||
};
|
};
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -20,6 +20,7 @@
|
||||||
|
|
||||||
#include <stdlib.h>
|
#include <stdlib.h>
|
||||||
#include <math.h>
|
#include <math.h>
|
||||||
|
#include "ChunkFile.h"
|
||||||
|
|
||||||
class Vec3
|
class Vec3
|
||||||
{
|
{
|
||||||
|
@ -111,6 +112,12 @@ public:
|
||||||
{
|
{
|
||||||
memset((void *)this,0,sizeof(float)*3);
|
memset((void *)this,0,sizeof(float)*3);
|
||||||
}
|
}
|
||||||
|
// Serializes the vector component by component: x, then y, then z.
void DoState(PointerWrap &p)
{
	p.Do(x);
	p.Do(y);
	p.Do(z);
}
|
||||||
};
|
};
|
||||||
|
|
||||||
#endif
|
#endif
|
||||||
|
|
|
@ -26,7 +26,9 @@ class VideoSoftware : public VideoBackend
|
||||||
void Video_ExitLoop();
|
void Video_ExitLoop();
|
||||||
void Video_BeginField(u32, FieldType, u32, u32);
|
void Video_BeginField(u32, FieldType, u32, u32);
|
||||||
void Video_EndField();
|
void Video_EndField();
|
||||||
|
|
||||||
u32 Video_AccessEFB(EFBAccessType, u32, u32, u32);
|
u32 Video_AccessEFB(EFBAccessType, u32, u32, u32);
|
||||||
|
u32 Video_GetQueryResult(PerfQueryType type);
|
||||||
|
|
||||||
void Video_AddMessage(const char* pstr, unsigned int milliseconds);
|
void Video_AddMessage(const char* pstr, unsigned int milliseconds);
|
||||||
void Video_ClearMessages();
|
void Video_ClearMessages();
|
||||||
|
|
Loading…
Reference in New Issue