Core/DSP: Access all registers except ST* through the regcache

No speed difference, probably because our basic blocks are
too small to contain more than one access to any register
or used too seldom for multiple accesses to make a difference.



git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@7260 8ced0084-cf51-0410-be5f-012b33b47a6e
This commit is contained in:
pierre 2011-02-27 18:04:35 +00:00
parent ff62f492e6
commit d56390407f
12 changed files with 1483 additions and 774 deletions

View File

@ -87,10 +87,11 @@ void DSPEmitter::checkExceptions(u32 retval)
MOV(16, M(&(g_dsp.pc)), Imm16(compilePC)); MOV(16, M(&(g_dsp.pc)), Imm16(compilePC));
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
SaveDSPRegs(); gpr.saveRegs();
ABI_CallFunction((void *)&DSPCore_CheckExceptions); ABI_CallFunction((void *)&DSPCore_CheckExceptions);
MOV(32, R(EAX), Imm32(retval)); MOV(32, R(EAX), Imm32(retval));
JMP(returnDispatcher, true); JMP(returnDispatcher, true);
gpr.loadRegs(false);
gpr.flushRegs(c,false); gpr.flushRegs(c,false);
SetJumpTarget(skipCheck); SetJumpTarget(skipCheck);
@ -107,9 +108,9 @@ void DSPEmitter::Default(UDSPInstruction inst)
} }
// Fall back to interpreter // Fall back to interpreter
SaveDSPRegs(); gpr.pushRegs();
ABI_CallFunctionC16((void*)opTable[inst]->intFunc, inst); ABI_CallFunctionC16((void*)opTable[inst]->intFunc, inst);
LoadDSPRegs(); gpr.popRegs();
} }
void DSPEmitter::EmitInstruction(UDSPInstruction inst) void DSPEmitter::EmitInstruction(UDSPInstruction inst)
@ -122,9 +123,9 @@ void DSPEmitter::EmitInstruction(UDSPInstruction inst)
if ((inst >> 12) == 0x3) { if ((inst >> 12) == 0x3) {
if (! extOpTable[inst & 0x7F]->jitFunc) { if (! extOpTable[inst & 0x7F]->jitFunc) {
// Fall back to interpreter // Fall back to interpreter
SaveDSPRegs(); gpr.pushRegs();
ABI_CallFunctionC16((void*)extOpTable[inst & 0x7F]->intFunc, inst); ABI_CallFunctionC16((void*)extOpTable[inst & 0x7F]->intFunc, inst);
LoadDSPRegs(); gpr.popRegs();
INFO_LOG(DSPLLE, "Instruction not JITed(ext part): %04x\n", inst); INFO_LOG(DSPLLE, "Instruction not JITed(ext part): %04x\n", inst);
ext_is_jit = false; ext_is_jit = false;
} else { } else {
@ -134,9 +135,9 @@ void DSPEmitter::EmitInstruction(UDSPInstruction inst)
} else { } else {
if (!extOpTable[inst & 0xFF]->jitFunc) { if (!extOpTable[inst & 0xFF]->jitFunc) {
// Fall back to interpreter // Fall back to interpreter
SaveDSPRegs(); gpr.pushRegs();
ABI_CallFunctionC16((void*)extOpTable[inst & 0xFF]->intFunc, inst); ABI_CallFunctionC16((void*)extOpTable[inst & 0xFF]->intFunc, inst);
LoadDSPRegs(); gpr.popRegs();
INFO_LOG(DSPLLE, "Instruction not JITed(ext part): %04x\n", inst); INFO_LOG(DSPLLE, "Instruction not JITed(ext part): %04x\n", inst);
ext_is_jit = false; ext_is_jit = false;
} else { } else {
@ -161,9 +162,9 @@ void DSPEmitter::EmitInstruction(UDSPInstruction inst)
if (!ext_is_jit) { if (!ext_is_jit) {
//need to call the online cleanup function because //need to call the online cleanup function because
//the writeBackLog gets populated at runtime //the writeBackLog gets populated at runtime
SaveDSPRegs(); gpr.pushRegs();
ABI_CallFunction((void*)::applyWriteBackLog); ABI_CallFunction((void*)::applyWriteBackLog);
LoadDSPRegs(); gpr.popRegs();
} else { } else {
popExtValueToReg(); popExtValueToReg();
} }
@ -189,10 +190,10 @@ void DSPEmitter::Compile(u16 start_addr)
return; return;
if (g_dsp.exceptions == 0) if (g_dsp.exceptions == 0)
return; return;
*/ */
LoadDSPRegs(); gpr.loadRegs();
blockLinkEntry = GetCodePtr(); blockLinkEntry = GetCodePtr();
@ -240,7 +241,7 @@ void DSPEmitter::Compile(u16 start_addr)
// end of each block and in this order // end of each block and in this order
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
HandleLoop(); HandleLoop();
SaveDSPRegs(); gpr.saveRegs();
if (!DSPHost_OnThread() && DSPAnalyzer::code_flags[start_addr] & DSPAnalyzer::CODE_IDLE_SKIP) if (!DSPHost_OnThread() && DSPAnalyzer::code_flags[start_addr] & DSPAnalyzer::CODE_IDLE_SKIP)
{ {
MOV(16, R(EAX), Imm16(DSP_IDLE_SKIP_CYCLES)); MOV(16, R(EAX), Imm16(DSP_IDLE_SKIP_CYCLES));
@ -250,6 +251,7 @@ void DSPEmitter::Compile(u16 start_addr)
MOV(16, R(EAX), Imm16(blockSize[start_addr])); MOV(16, R(EAX), Imm16(blockSize[start_addr]));
} }
JMP(returnDispatcher, true); JMP(returnDispatcher, true);
gpr.loadRegs(false);
gpr.flushRegs(c,false); gpr.flushRegs(c,false);
SetJumpTarget(rLoopAddressExit); SetJumpTarget(rLoopAddressExit);
@ -273,7 +275,7 @@ void DSPEmitter::Compile(u16 start_addr)
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
//don't update g_dsp.pc -- the branch insn already did //don't update g_dsp.pc -- the branch insn already did
SaveDSPRegs(); gpr.saveRegs();
if (!DSPHost_OnThread() && DSPAnalyzer::code_flags[start_addr] & DSPAnalyzer::CODE_IDLE_SKIP) if (!DSPHost_OnThread() && DSPAnalyzer::code_flags[start_addr] & DSPAnalyzer::CODE_IDLE_SKIP)
{ {
MOV(16, R(EAX), Imm16(DSP_IDLE_SKIP_CYCLES)); MOV(16, R(EAX), Imm16(DSP_IDLE_SKIP_CYCLES));
@ -283,6 +285,7 @@ void DSPEmitter::Compile(u16 start_addr)
MOV(16, R(EAX), Imm16(blockSize[start_addr])); MOV(16, R(EAX), Imm16(blockSize[start_addr]));
} }
JMP(returnDispatcher, true); JMP(returnDispatcher, true);
gpr.loadRegs(false);
gpr.flushRegs(c,false); gpr.flushRegs(c,false);
SetJumpTarget(rNoBranch); SetJumpTarget(rNoBranch);
@ -334,7 +337,7 @@ void DSPEmitter::Compile(u16 start_addr)
blockSize[start_addr] = 1; blockSize[start_addr] = 1;
} }
SaveDSPRegs(); gpr.saveRegs();
if (!DSPHost_OnThread() && DSPAnalyzer::code_flags[start_addr] & DSPAnalyzer::CODE_IDLE_SKIP) if (!DSPHost_OnThread() && DSPAnalyzer::code_flags[start_addr] & DSPAnalyzer::CODE_IDLE_SKIP)
{ {
MOV(16, R(EAX), Imm16(DSP_IDLE_SKIP_CYCLES)); MOV(16, R(EAX), Imm16(DSP_IDLE_SKIP_CYCLES));
@ -342,7 +345,7 @@ void DSPEmitter::Compile(u16 start_addr)
else else
{ {
MOV(16, R(EAX), Imm16(blockSize[start_addr])); MOV(16, R(EAX), Imm16(blockSize[start_addr]));
} }
JMP(returnDispatcher, true); JMP(returnDispatcher, true);
} }

View File

@ -52,8 +52,10 @@ public:
// CC Util // CC Util
void Update_SR_Register64(Gen::X64Reg val = Gen::EAX); void Update_SR_Register64(Gen::X64Reg val = Gen::EAX);
void Update_SR_Register64_Carry(Gen::X64Reg val = Gen::EAX); void Update_SR_Register64_Carry(Gen::X64Reg val,
void Update_SR_Register64_Carry2(Gen::X64Reg val = Gen::EAX); Gen::X64Reg carry_ovfl);
void Update_SR_Register64_Carry2(Gen::X64Reg val,
Gen::X64Reg carry_ovfl);
void Update_SR_Register16(Gen::X64Reg val = Gen::EAX); void Update_SR_Register16(Gen::X64Reg val = Gen::EAX);
void Update_SR_Register16_OverS32(Gen::X64Reg val = Gen::EAX); void Update_SR_Register16_OverS32(Gen::X64Reg val = Gen::EAX);
@ -65,13 +67,13 @@ public:
// Memory helper functions // Memory helper functions
void increment_addr_reg(int reg); void increment_addr_reg(int reg);
void decrement_addr_reg(int reg); void decrement_addr_reg(int reg);
void increase_addr_reg(int reg); void increase_addr_reg(int reg, int ix_reg);
void decrease_addr_reg(int reg); void decrease_addr_reg(int reg);
void imem_read(); void imem_read(Gen::X64Reg address);
void dmem_read(); void dmem_read(Gen::X64Reg address);
void dmem_read_imm(u16 addr); void dmem_read_imm(u16 addr);
void dmem_write(); void dmem_write(Gen::X64Reg value);
void dmem_write_imm(u16 addr); void dmem_write_imm(u16 addr, Gen::X64Reg value);
// Ext command helpers // Ext command helpers
void pushExtValueFromReg(u16 dreg, u16 sreg); void pushExtValueFromReg(u16 dreg, u16 sreg);
@ -250,6 +252,7 @@ public:
// CALL this to start the dispatcher // CALL this to start the dispatcher
const u8 *enterDispatcher; const u8 *enterDispatcher;
const u8 *reenterDispatcher;
const u8 *stubEntryPoint; const u8 *stubEntryPoint;
const u8 *returnDispatcher; const u8 *returnDispatcher;
u16 compilePC; u16 compilePC;
@ -259,10 +262,6 @@ public:
std::list<u16> *unresolvedJumps; std::list<u16> *unresolvedJumps;
DSPJitRegCache gpr; DSPJitRegCache gpr;
void LoadDSPRegs();
void SaveDSPRegs();
private: private:
DSPCompiledCode *blocks; DSPCompiledCode *blocks;
Block blockLinkEntry; Block blockLinkEntry;
@ -275,12 +274,8 @@ private:
// Counts down. // Counts down.
// int cycles; // int cycles;
void Update_SR_Register(Gen::X64Reg val = Gen::EAX); void Update_SR_Register(Gen::X64Reg val = Gen::EAX);
void ToMask(Gen::X64Reg value_reg = Gen::EDI);
void dsp_increment_one(Gen::X64Reg ar = Gen::EAX, Gen::X64Reg wr = Gen::EDX, Gen::X64Reg wr_pow = Gen::EDI, Gen::X64Reg temp_reg = Gen::ESI);
void dsp_decrement_one(Gen::X64Reg ar = Gen::EAX, Gen::X64Reg wr = Gen::EDX, Gen::X64Reg wr_pow = Gen::EDI, Gen::X64Reg temp_reg = Gen::ESI);
void get_long_prod(Gen::X64Reg long_prod = Gen::RAX); void get_long_prod(Gen::X64Reg long_prod = Gen::RAX);
void get_long_prod_round_prodl(Gen::X64Reg long_prod = Gen::RAX); void get_long_prod_round_prodl(Gen::X64Reg long_prod = Gen::RAX);
void set_long_prod(); void set_long_prod();

View File

@ -210,16 +210,19 @@ void DSPEmitter::cmp(const UDSPInstruction opc)
#ifdef _M_X64 #ifdef _M_X64
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc0 = dsp_get_long_acc(0); // s64 acc0 = dsp_get_long_acc(0);
get_long_acc(0, RCX); get_long_acc(0, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 acc1 = dsp_get_long_acc(1); // s64 acc1 = dsp_get_long_acc(1);
get_long_acc(1, RDX); get_long_acc(1, RDX);
// s64 res = dsp_convert_long_acc(acc0 - acc1); // s64 res = dsp_convert_long_acc(acc0 - acc1);
SUB(64, R(RAX), R(RDX)); SUB(64, R(RAX), R(RDX));
// Update_SR_Register64(res, isCarry2(acc0, res), isOverflow(acc0, -acc1, res)); // CF -> influence on ABS/0xa100 // Update_SR_Register64(res, isCarry2(acc0, res), isOverflow(acc0, -acc1, res)); // CF -> influence on ABS/0xa100
NEG(64, R(RDX)); NEG(64, R(RDX));
Update_SR_Register64_Carry2(); Update_SR_Register64_Carry2(EAX, tmp1);
gpr.putXReg(tmp1);
} }
#else #else
Default(opc); Default(opc);
@ -227,7 +230,7 @@ void DSPEmitter::cmp(const UDSPInstruction opc)
} }
// CMPAR $acS axR.h // CMPAR $acS axR.h
// 1100 0001 xxxx xxxx // 110r s001 xxxx xxxx
// Compares accumulator $acS with accumulator axR.h. // Compares accumulator $acS with accumulator axR.h.
// Not described by Duddie's doc - at least not as a separate instruction. // Not described by Duddie's doc - at least not as a separate instruction.
// //
@ -240,9 +243,11 @@ void DSPEmitter::cmpar(const UDSPInstruction opc)
u8 rreg = ((opc >> 12) & 0x1); u8 rreg = ((opc >> 12) & 0x1);
u8 sreg = (opc >> 11) & 0x1; u8 sreg = (opc >> 11) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 sr = dsp_get_long_acc(sreg); // s64 sr = dsp_get_long_acc(sreg);
get_long_acc(sreg, RCX); get_long_acc(sreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 rr = (s16)g_dsp.r.axh[rreg]; // s64 rr = (s16)g_dsp.r.axh[rreg];
get_ax_h(rreg, RDX); get_ax_h(rreg, RDX);
// rr <<= 16; // rr <<= 16;
@ -251,7 +256,8 @@ void DSPEmitter::cmpar(const UDSPInstruction opc)
SUB(64, R(RAX), R(RDX)); SUB(64, R(RAX), R(RDX));
// Update_SR_Register64(res, isCarry2(sr, res), isOverflow(sr, -rr, res)); // Update_SR_Register64(res, isCarry2(sr, res), isOverflow(sr, -rr, res));
NEG(64, R(RDX)); NEG(64, R(RDX));
Update_SR_Register64_Carry2(); Update_SR_Register64_Carry2(EAX, tmp1);
gpr.putXReg(tmp1);
} }
#else #else
Default(opc); Default(opc);
@ -271,9 +277,11 @@ void DSPEmitter::cmpi(const UDSPInstruction opc)
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
u8 reg = (opc >> 8) & 0x1; u8 reg = (opc >> 8) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 val = dsp_get_long_acc(reg); // s64 val = dsp_get_long_acc(reg);
get_long_acc(reg, RCX); get_long_acc(reg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 imm = (s64)(s16)dsp_fetch_code() << 16; // Immediate is considered to be at M level in the 40-bit accumulator. // s64 imm = (s64)(s16)dsp_fetch_code() << 16; // Immediate is considered to be at M level in the 40-bit accumulator.
u16 imm = dsp_imem_read(compilePC+1); u16 imm = dsp_imem_read(compilePC+1);
MOV(64, R(RDX), Imm64((s64)(s16)imm << 16)); MOV(64, R(RDX), Imm64((s64)(s16)imm << 16));
@ -281,7 +289,8 @@ void DSPEmitter::cmpi(const UDSPInstruction opc)
SUB(64, R(RAX), R(RDX)); SUB(64, R(RAX), R(RDX));
// Update_SR_Register64(res, isCarry2(val, res), isOverflow(val, -imm, res)); // Update_SR_Register64(res, isCarry2(val, res), isOverflow(val, -imm, res));
NEG(64, R(RDX)); NEG(64, R(RDX));
Update_SR_Register64_Carry2(); Update_SR_Register64_Carry2(EAX, tmp1);
gpr.putXReg(tmp1);
} }
#else #else
Default(opc); Default(opc);
@ -302,8 +311,10 @@ void DSPEmitter::cmpis(const UDSPInstruction opc)
{ {
u8 areg = (opc >> 8) & 0x1; u8 areg = (opc >> 8) & 0x1;
// s64 acc = dsp_get_long_acc(areg); // s64 acc = dsp_get_long_acc(areg);
get_long_acc(areg, RCX); X64Reg tmp1;
MOV(64, R(RAX), R(RCX)); gpr.getFreeXReg(tmp1);
get_long_acc(areg, tmp1);
MOV(64, R(RAX), R(tmp1));
// s64 val = (s8)opc; // s64 val = (s8)opc;
// val <<= 16; // val <<= 16;
MOV(64, R(RDX), Imm64((s64)(s8)opc << 16)); MOV(64, R(RDX), Imm64((s64)(s8)opc << 16));
@ -311,7 +322,8 @@ void DSPEmitter::cmpis(const UDSPInstruction opc)
SUB(64, R(RAX), R(RDX)); SUB(64, R(RAX), R(RDX));
// Update_SR_Register64(res, isCarry2(acc, res), isOverflow(acc, -val, res)); // Update_SR_Register64(res, isCarry2(acc, res), isOverflow(acc, -val, res));
NEG(64, R(RDX)); NEG(64, R(RDX));
Update_SR_Register64_Carry2(); Update_SR_Register64_Carry2(EAX, tmp1);
gpr.putXReg(tmp1);
} }
#else #else
Default(opc); Default(opc);
@ -341,7 +353,7 @@ void DSPEmitter::xorr(const UDSPInstruction opc)
// Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg))); // Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg)));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
get_long_acc(dreg, RSI); get_long_acc(dreg, RCX);
Update_SR_Register16_OverS32(); Update_SR_Register16_OverS32();
} }
#else #else
@ -370,7 +382,7 @@ void DSPEmitter::andr(const UDSPInstruction opc)
// Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg))); // Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg)));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
get_long_acc(dreg, RSI); get_long_acc(dreg, RCX);
Update_SR_Register16_OverS32(); Update_SR_Register16_OverS32();
} }
#else #else
@ -399,7 +411,7 @@ void DSPEmitter::orr(const UDSPInstruction opc)
// Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg))); // Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg)));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
get_long_acc(dreg, RSI); get_long_acc(dreg, RCX);
Update_SR_Register16_OverS32(); Update_SR_Register16_OverS32();
} }
#else #else
@ -427,7 +439,7 @@ void DSPEmitter::andc(const UDSPInstruction opc)
// Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg))); // Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg)));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
get_long_acc(dreg, RSI); get_long_acc(dreg, RCX);
Update_SR_Register16_OverS32(); Update_SR_Register16_OverS32();
} }
#else #else
@ -455,7 +467,7 @@ void DSPEmitter::orc(const UDSPInstruction opc)
// Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg))); // Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg)));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
get_long_acc(dreg, RSI); get_long_acc(dreg, RCX);
Update_SR_Register16_OverS32(); Update_SR_Register16_OverS32();
} }
#else #else
@ -482,7 +494,7 @@ void DSPEmitter::xorc(const UDSPInstruction opc)
// Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg))); // Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg)));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
get_long_acc(dreg, RSI); get_long_acc(dreg, RCX);
Update_SR_Register16_OverS32(); Update_SR_Register16_OverS32();
} }
#else #else
@ -508,7 +520,7 @@ void DSPEmitter::notc(const UDSPInstruction opc)
// Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg))); // Update_SR_Register16((s16)accm, false, false, isOverS32(dsp_get_long_acc(dreg)));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
get_long_acc(dreg, RSI); get_long_acc(dreg, RCX);
Update_SR_Register16_OverS32(); Update_SR_Register16_OverS32();
} }
#else #else
@ -536,7 +548,7 @@ void DSPEmitter::xori(const UDSPInstruction opc)
// Update_SR_Register16((s16)g_dsp.r.acm[reg], false, false, isOverS32(dsp_get_long_acc(reg))); // Update_SR_Register16((s16)g_dsp.r.acm[reg], false, false, isOverS32(dsp_get_long_acc(reg)));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
get_long_acc(reg, RSI); get_long_acc(reg, RCX);
Update_SR_Register16_OverS32(); Update_SR_Register16_OverS32();
} }
#else #else
@ -563,7 +575,7 @@ void DSPEmitter::andi(const UDSPInstruction opc)
// Update_SR_Register16((s16)g_dsp.r.acm[reg], false, false, isOverS32(dsp_get_long_acc(reg))); // Update_SR_Register16((s16)g_dsp.r.acm[reg], false, false, isOverS32(dsp_get_long_acc(reg)));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
get_long_acc(reg, RSI); get_long_acc(reg, RCX);
Update_SR_Register16_OverS32(); Update_SR_Register16_OverS32();
} }
#else #else
@ -590,7 +602,7 @@ void DSPEmitter::ori(const UDSPInstruction opc)
// Update_SR_Register16((s16)g_dsp.r.acm[reg], false, false, isOverS32(dsp_get_long_acc(reg))); // Update_SR_Register16((s16)g_dsp.r.acm[reg], false, false, isOverS32(dsp_get_long_acc(reg)));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
get_long_acc(reg, RSI); get_long_acc(reg, RCX);
Update_SR_Register16_OverS32(); Update_SR_Register16_OverS32();
} }
#else #else
@ -612,8 +624,10 @@ void DSPEmitter::addr(const UDSPInstruction opc)
u8 sreg = ((opc >> 9) & 0x3) + DSP_REG_AXL0; u8 sreg = ((opc >> 9) & 0x3) + DSP_REG_AXL0;
// s64 acc = dsp_get_long_acc(dreg); // s64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); X64Reg tmp1;
MOV(64, R(RAX), R(RCX)); gpr.getFreeXReg(tmp1);
get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(tmp1));
// s64 ax = (s16)g_dsp.r[sreg]; // s64 ax = (s16)g_dsp.r[sreg];
dsp_op_read_reg(sreg, RDX, SIGN); dsp_op_read_reg(sreg, RDX, SIGN);
// ax <<= 16; // ax <<= 16;
@ -624,15 +638,15 @@ void DSPEmitter::addr(const UDSPInstruction opc)
// Update_SR_Register64(res, isCarry(acc, res), isOverflow(acc, ax, res)); // Update_SR_Register64(res, isCarry(acc, res), isOverflow(acc, ax, res));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry(); Update_SR_Register64_Carry(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -649,9 +663,11 @@ void DSPEmitter::addax(const UDSPInstruction opc)
u8 dreg = (opc >> 8) & 0x1; u8 dreg = (opc >> 8) & 0x1;
u8 sreg = (opc >> 9) & 0x1; u8 sreg = (opc >> 9) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc = dsp_get_long_acc(dreg); // s64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 ax = dsp_get_long_acx(sreg); // s64 ax = dsp_get_long_acx(sreg);
get_long_acx(sreg, RDX); get_long_acx(sreg, RDX);
// s64 res = acc + ax; // s64 res = acc + ax;
@ -661,14 +677,15 @@ void DSPEmitter::addax(const UDSPInstruction opc)
// Update_SR_Register64(res, isCarry(acc, res), isOverflow(acc, ax, res)); // Update_SR_Register64(res, isCarry(acc, res), isOverflow(acc, ax, res));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry(); Update_SR_Register64_Carry(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -684,9 +701,11 @@ void DSPEmitter::add(const UDSPInstruction opc)
#ifdef _M_X64 #ifdef _M_X64
u8 dreg = (opc >> 8) & 0x1; u8 dreg = (opc >> 8) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc0 = dsp_get_long_acc(dreg); // s64 acc0 = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 acc1 = dsp_get_long_acc(1 - dreg); // s64 acc1 = dsp_get_long_acc(1 - dreg);
get_long_acc(1 - dreg, RDX); get_long_acc(1 - dreg, RDX);
// s64 res = acc0 + acc1; // s64 res = acc0 + acc1;
@ -696,14 +715,15 @@ void DSPEmitter::add(const UDSPInstruction opc)
// Update_SR_Register64(res, isCarry(acc0, res), isOverflow(acc0, acc1, res)); // Update_SR_Register64(res, isCarry(acc0, res), isOverflow(acc0, acc1, res));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry(); Update_SR_Register64_Carry(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -719,9 +739,11 @@ void DSPEmitter::addp(const UDSPInstruction opc)
#ifdef _M_X64 #ifdef _M_X64
u8 dreg = (opc >> 8) & 0x1; u8 dreg = (opc >> 8) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc = dsp_get_long_acc(dreg); // s64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 prod = dsp_get_long_prod(); // s64 prod = dsp_get_long_prod();
get_long_prod(RDX); get_long_prod(RDX);
// s64 res = acc + prod; // s64 res = acc + prod;
@ -731,14 +753,15 @@ void DSPEmitter::addp(const UDSPInstruction opc)
// Update_SR_Register64(res, isCarry2(acc, res), isOverflow(acc, prod, res)); // Update_SR_Register64(res, isCarry2(acc, res), isOverflow(acc, prod, res));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry2(); Update_SR_Register64_Carry2(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -756,9 +779,11 @@ void DSPEmitter::addaxl(const UDSPInstruction opc)
u8 sreg = (opc >> 9) & 0x1; u8 sreg = (opc >> 9) & 0x1;
u8 dreg = (opc >> 8) & 0x1; u8 dreg = (opc >> 8) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// u64 acc = dsp_get_long_acc(dreg); // u64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// u16 acx = (u16)dsp_get_ax_l(sreg); // u16 acx = (u16)dsp_get_ax_l(sreg);
get_ax_l(sreg, RDX); get_ax_l(sreg, RDX);
// u64 res = acc + acx; // u64 res = acc + acx;
@ -768,14 +793,15 @@ void DSPEmitter::addaxl(const UDSPInstruction opc)
// Update_SR_Register64((s64)res, isCarry(acc, res), isOverflow((s64)acc, (s64)acx, (s64)res)); // Update_SR_Register64((s64)res, isCarry(acc, res), isOverflow((s64)acc, (s64)acx, (s64)res));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry(); Update_SR_Register64_Carry(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -791,9 +817,11 @@ void DSPEmitter::addi(const UDSPInstruction opc)
{ {
#ifdef _M_X64 #ifdef _M_X64
u8 areg = (opc >> 8) & 0x1; u8 areg = (opc >> 8) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc = dsp_get_long_acc(areg); // s64 acc = dsp_get_long_acc(areg);
get_long_acc(areg, RCX); get_long_acc(areg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 imm = (s16)dsp_fetch_code(); // s64 imm = (s16)dsp_fetch_code();
s16 imm = dsp_imem_read(compilePC+1); s16 imm = dsp_imem_read(compilePC+1);
//imm <<= 16; //imm <<= 16;
@ -807,14 +835,15 @@ void DSPEmitter::addi(const UDSPInstruction opc)
// Update_SR_Register64(res, isCarry(acc, res), isOverflow(acc, imm, res)); // Update_SR_Register64(res, isCarry(acc, res), isOverflow(acc, imm, res));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(areg, RSI); set_long_acc(areg, RCX);
Update_SR_Register64_Carry(); Update_SR_Register64_Carry(EAX, tmp1);
} }
else else
{ {
set_long_acc(areg, RAX); set_long_acc(areg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -830,9 +859,11 @@ void DSPEmitter::addis(const UDSPInstruction opc)
#ifdef _M_X64 #ifdef _M_X64
u8 dreg = (opc >> 8) & 0x1; u8 dreg = (opc >> 8) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc = dsp_get_long_acc(dreg); // s64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 imm = (s8)(u8)opc; // s64 imm = (s8)(u8)opc;
// imm <<= 16; // imm <<= 16;
MOV(8, R(RDX), Imm8((u8)opc)); MOV(8, R(RDX), Imm8((u8)opc));
@ -845,14 +876,15 @@ void DSPEmitter::addis(const UDSPInstruction opc)
// Update_SR_Register64(res, isCarry(acc, res), isOverflow(acc, imm, res)); // Update_SR_Register64(res, isCarry(acc, res), isOverflow(acc, imm, res));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry(); Update_SR_Register64_Carry(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -868,9 +900,11 @@ void DSPEmitter::incm(const UDSPInstruction opc)
#ifdef _M_X64 #ifdef _M_X64
u8 dreg = (opc >> 8) & 0x1; u8 dreg = (opc >> 8) & 0x1;
s64 subtract = 0x10000; s64 subtract = 0x10000;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc = dsp_get_long_acc(dreg); // s64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 res = acc + sub; // s64 res = acc + sub;
ADD(64, R(RAX), Imm32((u32)subtract)); ADD(64, R(RAX), Imm32((u32)subtract));
// dsp_set_long_acc(dreg, res); // dsp_set_long_acc(dreg, res);
@ -879,15 +913,15 @@ void DSPEmitter::incm(const UDSPInstruction opc)
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
MOV(64, R(RDX), Imm32((u32)subtract)); MOV(64, R(RDX), Imm32((u32)subtract));
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry(); Update_SR_Register64_Carry(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg); set_long_acc(dreg);
Update_SR_Register64_Carry();
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -902,9 +936,11 @@ void DSPEmitter::inc(const UDSPInstruction opc)
{ {
#ifdef _M_X64 #ifdef _M_X64
u8 dreg = (opc >> 8) & 0x1; u8 dreg = (opc >> 8) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc = dsp_get_long_acc(dreg); // s64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 res = acc + 1; // s64 res = acc + 1;
ADD(64, R(RAX), Imm8(1)); ADD(64, R(RAX), Imm8(1));
// dsp_set_long_acc(dreg, res); // dsp_set_long_acc(dreg, res);
@ -913,15 +949,16 @@ void DSPEmitter::inc(const UDSPInstruction opc)
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
MOV(64, R(RDX), Imm64(1)); MOV(64, R(RDX), Imm64(1));
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry(); Update_SR_Register64_Carry(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg); set_long_acc(dreg);
Update_SR_Register64_Carry(); Update_SR_Register64_Carry(EAX, tmp1);//why is this still done?
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -940,9 +977,11 @@ void DSPEmitter::subr(const UDSPInstruction opc)
u8 dreg = (opc >> 8) & 0x1; u8 dreg = (opc >> 8) & 0x1;
u8 sreg = ((opc >> 9) & 0x3) + DSP_REG_AXL0; u8 sreg = ((opc >> 9) & 0x3) + DSP_REG_AXL0;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc = dsp_get_long_acc(dreg); // s64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 ax = (s16)g_dsp.r[sreg]; // s64 ax = (s16)g_dsp.r[sreg];
dsp_op_read_reg(sreg, RDX, SIGN); dsp_op_read_reg(sreg, RDX, SIGN);
// ax <<= 16; // ax <<= 16;
@ -955,14 +994,15 @@ void DSPEmitter::subr(const UDSPInstruction opc)
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
NEG(64, R(RDX)); NEG(64, R(RDX));
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry2(); Update_SR_Register64_Carry2(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -979,9 +1019,11 @@ void DSPEmitter::subax(const UDSPInstruction opc)
u8 dreg = (opc >> 8) & 0x1; u8 dreg = (opc >> 8) & 0x1;
u8 sreg = (opc >> 9) & 0x1; u8 sreg = (opc >> 9) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc = dsp_get_long_acc(dreg); // s64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 acx = dsp_get_long_acx(sreg); // s64 acx = dsp_get_long_acx(sreg);
get_long_acx(sreg, RDX); get_long_acx(sreg, RDX);
// s64 res = acc - acx; // s64 res = acc - acx;
@ -992,14 +1034,15 @@ void DSPEmitter::subax(const UDSPInstruction opc)
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
NEG(64, R(RDX)); NEG(64, R(RDX));
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry2(); Update_SR_Register64_Carry2(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -1014,9 +1057,11 @@ void DSPEmitter::sub(const UDSPInstruction opc)
{ {
#ifdef _M_X64 #ifdef _M_X64
u8 dreg = (opc >> 8) & 0x1; u8 dreg = (opc >> 8) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc1 = dsp_get_long_acc(dreg); // s64 acc1 = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 acc2 = dsp_get_long_acc(1 - dreg); // s64 acc2 = dsp_get_long_acc(1 - dreg);
get_long_acc(1 - dreg, RDX); get_long_acc(1 - dreg, RDX);
// s64 res = acc1 - acc2; // s64 res = acc1 - acc2;
@ -1027,14 +1072,15 @@ void DSPEmitter::sub(const UDSPInstruction opc)
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
NEG(64, R(RDX)); NEG(64, R(RDX));
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry2(); Update_SR_Register64_Carry2(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -1049,9 +1095,11 @@ void DSPEmitter::subp(const UDSPInstruction opc)
{ {
#ifdef _M_X64 #ifdef _M_X64
u8 dreg = (opc >> 8) & 0x1; u8 dreg = (opc >> 8) & 0x1;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc = dsp_get_long_acc(dreg); // s64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 prod = dsp_get_long_prod(); // s64 prod = dsp_get_long_prod();
get_long_prod(RDX); get_long_prod(RDX);
// s64 res = acc - prod; // s64 res = acc - prod;
@ -1062,14 +1110,15 @@ void DSPEmitter::subp(const UDSPInstruction opc)
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
NEG(64, R(RDX)); NEG(64, R(RDX));
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry2(); Update_SR_Register64_Carry2(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -1085,9 +1134,11 @@ void DSPEmitter::decm(const UDSPInstruction opc)
#ifdef _M_X64 #ifdef _M_X64
u8 dreg = (opc >> 8) & 0x01; u8 dreg = (opc >> 8) & 0x01;
s64 subtract = 0x10000; s64 subtract = 0x10000;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc = dsp_get_long_acc(dreg); // s64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 res = acc - sub; // s64 res = acc - sub;
SUB(64, R(RAX), Imm32((u32)subtract)); SUB(64, R(RAX), Imm32((u32)subtract));
// dsp_set_long_acc(dreg, res); // dsp_set_long_acc(dreg, res);
@ -1096,14 +1147,15 @@ void DSPEmitter::decm(const UDSPInstruction opc)
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
MOV(64, R(RDX), Imm64(-subtract)); MOV(64, R(RDX), Imm64(-subtract));
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry2(); Update_SR_Register64_Carry2(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -1118,9 +1170,11 @@ void DSPEmitter::dec(const UDSPInstruction opc)
{ {
#ifdef _M_X64 #ifdef _M_X64
u8 dreg = (opc >> 8) & 0x01; u8 dreg = (opc >> 8) & 0x01;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// s64 acc = dsp_get_long_acc(dreg); // s64 acc = dsp_get_long_acc(dreg);
get_long_acc(dreg, RCX); get_long_acc(dreg, tmp1);
MOV(64, R(RAX), R(RCX)); MOV(64, R(RAX), R(tmp1));
// s64 res = acc - 1; // s64 res = acc - 1;
SUB(64, R(RAX), Imm32(1)); SUB(64, R(RAX), Imm32(1));
// dsp_set_long_acc(dreg, res); // dsp_set_long_acc(dreg, res);
@ -1129,14 +1183,15 @@ void DSPEmitter::dec(const UDSPInstruction opc)
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
MOV(64, R(RDX), Imm64(-1)); MOV(64, R(RDX), Imm64(-1));
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry2(); Update_SR_Register64_Carry2(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg); set_long_acc(dreg);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif

View File

@ -56,8 +56,8 @@ static void ReJitConditional(const UDSPInstruction opc, DSPEmitter& emitter)
emitter.TEST(16, R(EAX), Imm16(1)); emitter.TEST(16, R(EAX), Imm16(1));
//LE: problem in here, half the tests fail //LE: problem in here, half the tests fail
skipCode2 = emitter.J_CC(CC_NE); skipCode2 = emitter.J_CC(CC_NE, true);
//skipCode2 = emitter.J_CC((CCFlags)(CC_NE - (cond & 1))); //skipCode2 = emitter.J_CC((CCFlags)(CC_NE - (cond & 1)), true);
emitter.dsp_op_read_reg(DSP_REG_SR, RAX); emitter.dsp_op_read_reg(DSP_REG_SR, RAX);
emitter.TEST(16, R(EAX), Imm16(SR_ARITH_ZERO)); emitter.TEST(16, R(EAX), Imm16(SR_ARITH_ZERO));
break; break;
@ -94,7 +94,7 @@ static void ReJitConditional(const UDSPInstruction opc, DSPEmitter& emitter)
break; break;
//c2 = emitter.gpr; //c2 = emitter.gpr;
//emitter.TEST(16, R(EAX), Imm16(SR_OVER_S32 | SR_TOP2BITS)); //emitter.TEST(16, R(EAX), Imm16(SR_OVER_S32 | SR_TOP2BITS));
//skipCode2 = emitter.J_CC((CCFlags)(CC_E + (cond & 1))); //skipCode2 = emitter.J_CC((CCFlags)(CC_E + (cond & 1)), true);
//emitter.TEST(16, R(EAX), Imm16(SR_ARITH_ZERO)); //emitter.TEST(16, R(EAX), Imm16(SR_ARITH_ZERO));
//break; //break;
} }
@ -107,7 +107,7 @@ static void ReJitConditional(const UDSPInstruction opc, DSPEmitter& emitter)
break; break;
} }
DSPJitRegCache c1(emitter.gpr); DSPJitRegCache c1(emitter.gpr);
FixupBranch skipCode = cond == 0xe ? emitter.J_CC(CC_E) : emitter.J_CC((CCFlags)(CC_NE - (cond & 1))); FixupBranch skipCode = cond == 0xe ? emitter.J_CC(CC_E,true) : emitter.J_CC((CCFlags)(CC_NE - (cond & 1)),true);
jitCode(opc,emitter); jitCode(opc,emitter);
emitter.gpr.flushRegs(c1); emitter.gpr.flushRegs(c1);
emitter.SetJumpTarget(skipCode); emitter.SetJumpTarget(skipCode);
@ -121,7 +121,8 @@ static void ReJitConditional(const UDSPInstruction opc, DSPEmitter& emitter)
static void WriteBranchExit(DSPEmitter& emitter) static void WriteBranchExit(DSPEmitter& emitter)
{ {
emitter.SaveDSPRegs(); DSPJitRegCache c(emitter.gpr);
emitter.gpr.saveRegs();
if (DSPAnalyzer::code_flags[emitter.startAddr] & DSPAnalyzer::CODE_IDLE_SKIP) if (DSPAnalyzer::code_flags[emitter.startAddr] & DSPAnalyzer::CODE_IDLE_SKIP)
{ {
emitter.MOV(16, R(EAX), Imm16(0x1000)); emitter.MOV(16, R(EAX), Imm16(0x1000));
@ -131,6 +132,8 @@ static void WriteBranchExit(DSPEmitter& emitter)
emitter.MOV(16, R(EAX), Imm16(emitter.blockSize[emitter.startAddr])); emitter.MOV(16, R(EAX), Imm16(emitter.blockSize[emitter.startAddr]));
} }
emitter.JMP(emitter.returnDispatcher, true); emitter.JMP(emitter.returnDispatcher, true);
emitter.gpr.loadRegs(false);
emitter.gpr.flushRegs(c,false);
} }
static void WriteBlockLink(DSPEmitter& emitter, u16 dest) static void WriteBlockLink(DSPEmitter& emitter, u16 dest)
@ -142,12 +145,12 @@ static void WriteBlockLink(DSPEmitter& emitter, u16 dest)
{ {
emitter.gpr.flushRegs(); emitter.gpr.flushRegs();
// Check if we have enough cycles to execute the next block // Check if we have enough cycles to execute the next block
emitter.MOV(16, R(ESI), M(&cyclesLeft)); emitter.MOV(16, R(ECX), M(&cyclesLeft));
emitter.CMP(16, R(ESI), Imm16(emitter.blockSize[emitter.startAddr] + emitter.blockSize[dest])); emitter.CMP(16, R(ECX), Imm16(emitter.blockSize[emitter.startAddr] + emitter.blockSize[dest]));
FixupBranch notEnoughCycles = emitter.J_CC(CC_BE); FixupBranch notEnoughCycles = emitter.J_CC(CC_BE);
emitter.SUB(16, R(ESI), Imm16(emitter.blockSize[emitter.startAddr])); emitter.SUB(16, R(ECX), Imm16(emitter.blockSize[emitter.startAddr]));
emitter.MOV(16, M(&cyclesLeft), R(ESI)); emitter.MOV(16, M(&cyclesLeft), R(ECX));
emitter.JMP(emitter.blockLinks[dest], true); emitter.JMP(emitter.blockLinks[dest], true);
emitter.SetJumpTarget(notEnoughCycles); emitter.SetJumpTarget(notEnoughCycles);
} }
@ -339,9 +342,11 @@ void DSPEmitter::HandleLoop()
FixupBranch loopUpdated = J(true); FixupBranch loopUpdated = J(true);
SetJumpTarget(loadStack); SetJumpTarget(loadStack);
DSPJitRegCache c(gpr);
dsp_reg_load_stack(0); dsp_reg_load_stack(0);
dsp_reg_load_stack(2); dsp_reg_load_stack(2);
dsp_reg_load_stack(3); dsp_reg_load_stack(3);
gpr.flushRegs(c);
SetJumpTarget(loopUpdated); SetJumpTarget(loopUpdated);
SetJumpTarget(rLoopAddrG); SetJumpTarget(rLoopAddrG);

View File

@ -22,12 +22,12 @@
#include "../DSPIntUtil.h" #include "../DSPIntUtil.h"
#include "../DSPEmitter.h" #include "../DSPEmitter.h"
#include "DSPJitUtil.h"
#include "x64Emitter.h" #include "x64Emitter.h"
#include "ABI.h" #include "ABI.h"
using namespace Gen; using namespace Gen;
// In: RAX: s64 _Value // In: RAX: s64 _Value
// In: RCX: 1 = carry, 2 = overflow
// Clobbers RDX // Clobbers RDX
void DSPEmitter::Update_SR_Register(Gen::X64Reg val) void DSPEmitter::Update_SR_Register(Gen::X64Reg val)
{ {
@ -72,7 +72,6 @@ void DSPEmitter::Update_SR_Register(Gen::X64Reg val)
} }
// In: RAX: s64 _Value // In: RAX: s64 _Value
// In: RCX: 1 = carry, 2 = overflow
// Clobbers RDX // Clobbers RDX
void DSPEmitter::Update_SR_Register64(Gen::X64Reg val) void DSPEmitter::Update_SR_Register64(Gen::X64Reg val)
{ {
@ -86,18 +85,18 @@ void DSPEmitter::Update_SR_Register64(Gen::X64Reg val)
#endif #endif
} }
// In: RAX: s64 _Value // In: (val): s64 _Value
// In: RCX: 1 = carry, 2 = overflow // In: (carry_ovfl): 1 = carry, 2 = overflow
// Clobbers RDX // Clobbers RDX
void DSPEmitter::Update_SR_Register64_Carry(Gen::X64Reg val) void DSPEmitter::Update_SR_Register64_Carry(X64Reg val, X64Reg carry_ovfl)
{ {
#ifdef _M_X64 #ifdef _M_X64
OpArg sr_reg; OpArg sr_reg;
gpr.getReg(DSP_REG_SR,sr_reg); gpr.getReg(DSP_REG_SR,sr_reg);
// g_dsp.r[DSP_REG_SR] &= ~SR_CMP_MASK; // g_dsp.r[DSP_REG_SR] &= ~SR_CMP_MASK;
AND(16, sr_reg, Imm16(~SR_CMP_MASK)); AND(16, sr_reg, Imm16(~SR_CMP_MASK));
CMP(64, R(RCX), R(val)); CMP(64, R(carry_ovfl), R(val));
// 0x01 // 0x01
// g_dsp.r[DSP_REG_SR] |= SR_CARRY; // g_dsp.r[DSP_REG_SR] |= SR_CARRY;
@ -110,10 +109,10 @@ void DSPEmitter::Update_SR_Register64_Carry(Gen::X64Reg val)
// g_dsp.r[DSP_REG_SR] |= SR_OVERFLOW; // g_dsp.r[DSP_REG_SR] |= SR_OVERFLOW;
// g_dsp.r[DSP_REG_SR] |= SR_OVERFLOW_STICKY; // g_dsp.r[DSP_REG_SR] |= SR_OVERFLOW_STICKY;
// Overflow = ((acc ^ res) & (ax ^ res)) < 0 // Overflow = ((acc ^ res) & (ax ^ res)) < 0
XOR(64, R(RCX), R(val)); XOR(64, R(carry_ovfl), R(val));
XOR(64, R(RDX), R(val)); XOR(64, R(RDX), R(val));
AND(64, R(RCX), R(RDX)); AND(64, R(carry_ovfl), R(RDX));
CMP(64, R(RCX), Imm8(0)); CMP(64, R(carry_ovfl), Imm8(0));
FixupBranch noOverflow = J_CC(CC_GE); FixupBranch noOverflow = J_CC(CC_GE);
OR(16, sr_reg, Imm16(SR_OVERFLOW | SR_OVERFLOW_STICKY)); OR(16, sr_reg, Imm16(SR_OVERFLOW | SR_OVERFLOW_STICKY));
SetJumpTarget(noOverflow); SetJumpTarget(noOverflow);
@ -123,10 +122,10 @@ void DSPEmitter::Update_SR_Register64_Carry(Gen::X64Reg val)
#endif #endif
} }
// In: RAX: s64 _Value // In: (val): s64 _Value
// In: RCX: 1 = carry, 2 = overflow // In: (carry_ovfl): 1 = carry, 2 = overflow
// Clobbers RDX // Clobbers RDX
void DSPEmitter::Update_SR_Register64_Carry2(Gen::X64Reg val) void DSPEmitter::Update_SR_Register64_Carry2(X64Reg val, X64Reg carry_ovfl)
{ {
#ifdef _M_X64 #ifdef _M_X64
OpArg sr_reg; OpArg sr_reg;
@ -134,7 +133,7 @@ void DSPEmitter::Update_SR_Register64_Carry2(Gen::X64Reg val)
// g_dsp.r[DSP_REG_SR] &= ~SR_CMP_MASK; // g_dsp.r[DSP_REG_SR] &= ~SR_CMP_MASK;
AND(16, sr_reg, Imm16(~SR_CMP_MASK)); AND(16, sr_reg, Imm16(~SR_CMP_MASK));
CMP(64, R(RCX), R(val)); CMP(64, R(carry_ovfl), R(val));
// 0x01 // 0x01
// g_dsp.r[DSP_REG_SR] |= SR_CARRY; // g_dsp.r[DSP_REG_SR] |= SR_CARRY;
@ -147,10 +146,10 @@ void DSPEmitter::Update_SR_Register64_Carry2(Gen::X64Reg val)
// g_dsp.r[DSP_REG_SR] |= SR_OVERFLOW; // g_dsp.r[DSP_REG_SR] |= SR_OVERFLOW;
// g_dsp.r[DSP_REG_SR] |= SR_OVERFLOW_STICKY; // g_dsp.r[DSP_REG_SR] |= SR_OVERFLOW_STICKY;
// Overflow = ((acc ^ res) & (ax ^ res)) < 0 // Overflow = ((acc ^ res) & (ax ^ res)) < 0
XOR(64, R(RCX), R(val)); XOR(64, R(carry_ovfl), R(val));
XOR(64, R(RDX), R(val)); XOR(64, R(RDX), R(val));
AND(64, R(RCX), R(RDX)); AND(64, R(carry_ovfl), R(RDX));
CMP(64, R(RCX), Imm8(0)); CMP(64, R(carry_ovfl), Imm8(0));
FixupBranch noOverflow = J_CC(CC_GE); FixupBranch noOverflow = J_CC(CC_GE);
OR(16, sr_reg, Imm16(SR_OVERFLOW | SR_OVERFLOW_STICKY)); OR(16, sr_reg, Imm16(SR_OVERFLOW | SR_OVERFLOW_STICKY));
SetJumpTarget(noOverflow); SetJumpTarget(noOverflow);
@ -171,9 +170,8 @@ void DSPEmitter::Update_SR_Register64_Carry2(Gen::X64Reg val)
//} //}
// In: RAX: s64 _Value // In: RAX: s64 _Value
// In: RCX: 1 = carry, 2 = overflow
// Clobbers RDX // Clobbers RDX
void DSPEmitter::Update_SR_Register16(Gen::X64Reg val) void DSPEmitter::Update_SR_Register16(X64Reg val)
{ {
#ifdef _M_X64 #ifdef _M_X64
OpArg sr_reg; OpArg sr_reg;
@ -214,7 +212,6 @@ void DSPEmitter::Update_SR_Register16(Gen::X64Reg val)
} }
// In: RAX: s64 _Value // In: RAX: s64 _Value
// In: RCX: 1 = carry, 2 = overflow
// Clobbers RDX // Clobbers RDX
void DSPEmitter::Update_SR_Register16_OverS32(Gen::X64Reg val) void DSPEmitter::Update_SR_Register16_OverS32(Gen::X64Reg val)
{ {
@ -225,8 +222,8 @@ void DSPEmitter::Update_SR_Register16_OverS32(Gen::X64Reg val)
// // 0x10 // // 0x10
// if (_Value != (s32)_Value) g_dsp.r[DSP_REG_SR] |= SR_OVER_S32; // if (_Value != (s32)_Value) g_dsp.r[DSP_REG_SR] |= SR_OVER_S32;
MOVSX(64, 32, RSI, R(val)); MOVSX(64, 32, RCX, R(val));
CMP(64, R(RSI), R(val)); CMP(64, R(RCX), R(val));
FixupBranch noOverS32 = J_CC(CC_E); FixupBranch noOverS32 = J_CC(CC_E);
OR(16, sr_reg, Imm16(SR_OVER_S32)); OR(16, sr_reg, Imm16(SR_OVER_S32));
SetJumpTarget(noOverS32); SetJumpTarget(noOverS32);

View File

@ -58,7 +58,7 @@ void DSPEmitter::ir(const UDSPInstruction opc) {
void DSPEmitter::nr(const UDSPInstruction opc) { void DSPEmitter::nr(const UDSPInstruction opc) {
u8 reg = opc & 0x3; u8 reg = opc & 0x3;
increase_addr_reg(reg); increase_addr_reg(reg, reg);
} }
// MV $axD.D, $acS.S // MV $axD.D, $acS.S
@ -81,9 +81,16 @@ void DSPEmitter::s(const UDSPInstruction opc)
u8 sreg = ((opc >> 3) & 0x3) + DSP_REG_ACL0; u8 sreg = ((opc >> 3) & 0x3) + DSP_REG_ACL0;
// u16 addr = g_dsp.r[dest]; // u16 addr = g_dsp.r[dest];
dsp_op_read_reg(dreg, RAX, ZERO); dsp_op_read_reg(dreg, RAX, ZERO);
dsp_op_read_reg(sreg, RCX, ZERO);
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1, ZERO);
// u16 val = g_dsp.r[src]; // u16 val = g_dsp.r[src];
dmem_write(); dmem_write(tmp1);
gpr.putXReg(tmp1);
increment_addr_reg(dreg); increment_addr_reg(dreg);
} }
@ -96,9 +103,16 @@ void DSPEmitter::sn(const UDSPInstruction opc)
u8 dreg = opc & 0x3; u8 dreg = opc & 0x3;
u8 sreg = ((opc >> 3) & 0x3) + DSP_REG_ACL0; u8 sreg = ((opc >> 3) & 0x3) + DSP_REG_ACL0;
dsp_op_read_reg(dreg, RAX, ZERO); dsp_op_read_reg(dreg, RAX, ZERO);
dsp_op_read_reg(sreg, RCX, ZERO);
dmem_write(); X64Reg tmp1;
increase_addr_reg(dreg); gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1, ZERO);
dmem_write(tmp1);
gpr.putXReg(tmp1);
increase_addr_reg(dreg, dreg);
} }
// L $axD.D, @$arS // L $axD.D, @$arS
@ -117,7 +131,7 @@ void DSPEmitter::l(const UDSPInstruction opc)
//even if only for one bit, can only //even if only for one bit, can only
//store (up to) two registers in EBX, //store (up to) two registers in EBX,
//so store all of SR //so store all of SR
MOV(16, R(EAX), M(&g_dsp.r.sr)); dsp_op_read_reg(DSP_REG_SR, RAX);
SHL(32, R(EAX), Imm8(16)); SHL(32, R(EAX), Imm8(16));
OR(32, R(EBX), R(EAX)); OR(32, R(EBX), R(EAX));
} }
@ -141,12 +155,12 @@ void DSPEmitter::ln(const UDSPInstruction opc)
//even if only for one bit, can only //even if only for one bit, can only
//store (up to) two registers in EBX, //store (up to) two registers in EBX,
//so store all of SR //so store all of SR
MOV(16, R(EAX), M(&g_dsp.r.sr)); dsp_op_read_reg(DSP_REG_SR, RAX);
SHL(32, R(EAX), Imm8(16)); SHL(32, R(EAX), Imm8(16));
OR(32, R(EBX), R(EAX)); OR(32, R(EBX), R(EAX));
} }
increase_addr_reg(sreg); increase_addr_reg(sreg, sreg);
} }
// LS $axD.D, $acS.m // LS $axD.D, $acS.m
@ -159,8 +173,14 @@ void DSPEmitter::ls(const UDSPInstruction opc)
u8 sreg = opc & 0x1; u8 sreg = opc & 0x1;
u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0; u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0;
dsp_op_read_reg(DSP_REG_AR3, RAX, ZERO); dsp_op_read_reg(DSP_REG_AR3, RAX, ZERO);
get_acc_m(sreg, ECX, false);
dmem_write(); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
get_acc_m(sreg, tmp1, false);
dmem_write(tmp1);
gpr.putXReg(tmp1);
pushExtValueFromMem(dreg, DSP_REG_AR0); pushExtValueFromMem(dreg, DSP_REG_AR0);
@ -180,13 +200,19 @@ void DSPEmitter::lsn(const UDSPInstruction opc)
u8 sreg = opc & 0x1; u8 sreg = opc & 0x1;
u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0; u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0;
dsp_op_read_reg(DSP_REG_AR3, RAX, ZERO); dsp_op_read_reg(DSP_REG_AR3, RAX, ZERO);
get_acc_m(sreg, ECX, false);
dmem_write(); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
get_acc_m(sreg, tmp1, false);
dmem_write(tmp1);
gpr.putXReg(tmp1);
pushExtValueFromMem(dreg, DSP_REG_AR0); pushExtValueFromMem(dreg, DSP_REG_AR0);
increment_addr_reg(DSP_REG_AR3); increment_addr_reg(DSP_REG_AR3);
increase_addr_reg(DSP_REG_AR0); increase_addr_reg(DSP_REG_AR0, DSP_REG_AR0);
} }
// LSM $axD.D, $acS.m // LSM $axD.D, $acS.m
@ -200,12 +226,18 @@ void DSPEmitter::lsm(const UDSPInstruction opc)
u8 sreg = opc & 0x1; u8 sreg = opc & 0x1;
u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0; u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0;
dsp_op_read_reg(DSP_REG_AR3, RAX, ZERO); dsp_op_read_reg(DSP_REG_AR3, RAX, ZERO);
get_acc_m(sreg, ECX, false);
dmem_write(); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
get_acc_m(sreg, tmp1, false);
dmem_write(tmp1);
gpr.putXReg(tmp1);
pushExtValueFromMem(dreg, DSP_REG_AR0); pushExtValueFromMem(dreg, DSP_REG_AR0);
increase_addr_reg(DSP_REG_AR3); increase_addr_reg(DSP_REG_AR3, DSP_REG_AR3);
increment_addr_reg(DSP_REG_AR0); increment_addr_reg(DSP_REG_AR0);
} }
@ -221,13 +253,19 @@ void DSPEmitter::lsnm(const UDSPInstruction opc)
u8 sreg = opc & 0x1; u8 sreg = opc & 0x1;
u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0; u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0;
dsp_op_read_reg(DSP_REG_AR3, RAX, ZERO); dsp_op_read_reg(DSP_REG_AR3, RAX, ZERO);
get_acc_m(sreg, ECX, false);
dmem_write(); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
get_acc_m(sreg, tmp1, false);
dmem_write(tmp1);
gpr.putXReg(tmp1);
pushExtValueFromMem(dreg, DSP_REG_AR0); pushExtValueFromMem(dreg, DSP_REG_AR0);
increase_addr_reg(DSP_REG_AR3); increase_addr_reg(DSP_REG_AR3, DSP_REG_AR3);
increase_addr_reg(DSP_REG_AR0); increase_addr_reg(DSP_REG_AR0, DSP_REG_AR0);
} }
// SL $acS.m, $axD.D // SL $acS.m, $axD.D
@ -240,13 +278,19 @@ void DSPEmitter::sl(const UDSPInstruction opc)
u8 sreg = opc & 0x1; u8 sreg = opc & 0x1;
u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0; u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0;
dsp_op_read_reg(DSP_REG_AR0, RAX, ZERO); dsp_op_read_reg(DSP_REG_AR0, RAX, ZERO);
get_acc_m(sreg, ECX, false);
dmem_write(); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
get_acc_m(sreg, tmp1, false);
dmem_write(tmp1);
gpr.putXReg(tmp1);
pushExtValueFromMem(dreg, DSP_REG_AR3); pushExtValueFromMem(dreg, DSP_REG_AR3);
increment_addr_reg(DSP_REG_AR3); increment_addr_reg(DSP_REG_AR3);
increment_addr_reg(DSP_REG_AR0); increment_addr_reg(DSP_REG_AR0);
} }
// SLN $acS.m, $axD.D // SLN $acS.m, $axD.D
@ -260,13 +304,19 @@ void DSPEmitter::sln(const UDSPInstruction opc)
u8 sreg = opc & 0x1; u8 sreg = opc & 0x1;
u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0; u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0;
dsp_op_read_reg(DSP_REG_AR0, RAX, ZERO); dsp_op_read_reg(DSP_REG_AR0, RAX, ZERO);
get_acc_m(sreg, ECX, false);
dmem_write(); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
get_acc_m(sreg, tmp1, false);
dmem_write(tmp1);
gpr.putXReg(tmp1);
pushExtValueFromMem(dreg, DSP_REG_AR3); pushExtValueFromMem(dreg, DSP_REG_AR3);
increment_addr_reg(DSP_REG_AR3); increment_addr_reg(DSP_REG_AR3);
increase_addr_reg(DSP_REG_AR0); increase_addr_reg(DSP_REG_AR0, DSP_REG_AR0);
} }
// SLM $acS.m, $axD.D // SLM $acS.m, $axD.D
@ -280,12 +330,18 @@ void DSPEmitter::slm(const UDSPInstruction opc)
u8 sreg = opc & 0x1; u8 sreg = opc & 0x1;
u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0; u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0;
dsp_op_read_reg(DSP_REG_AR0, RAX, ZERO); dsp_op_read_reg(DSP_REG_AR0, RAX, ZERO);
get_acc_m(sreg, ECX, false);
dmem_write(); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
get_acc_m(sreg, tmp1, false);
dmem_write(tmp1);
gpr.putXReg(tmp1);
pushExtValueFromMem(dreg, DSP_REG_AR3); pushExtValueFromMem(dreg, DSP_REG_AR3);
increase_addr_reg(DSP_REG_AR3); increase_addr_reg(DSP_REG_AR3, DSP_REG_AR3);
increment_addr_reg(DSP_REG_AR0); increment_addr_reg(DSP_REG_AR0);
} }
@ -300,13 +356,19 @@ void DSPEmitter::slnm(const UDSPInstruction opc)
u8 sreg = opc & 0x1; u8 sreg = opc & 0x1;
u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0; u8 dreg = ((opc >> 4) & 0x3) + DSP_REG_AXL0;
dsp_op_read_reg(DSP_REG_AR0, RAX, ZERO); dsp_op_read_reg(DSP_REG_AR0, RAX, ZERO);
get_acc_m(sreg, ECX, false);
dmem_write(); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
get_acc_m(sreg, tmp1, false);
dmem_write(tmp1);
gpr.putXReg(tmp1);
pushExtValueFromMem(dreg, DSP_REG_AR3); pushExtValueFromMem(dreg, DSP_REG_AR3);
increase_addr_reg(DSP_REG_AR3); increase_addr_reg(DSP_REG_AR3, DSP_REG_AR3);
increase_addr_reg(DSP_REG_AR0); increase_addr_reg(DSP_REG_AR0, DSP_REG_AR0);
} }
// LD $ax0.d, $ax1.r, @$arS // LD $ax0.d, $ax1.r, @$arS
@ -319,6 +381,9 @@ void DSPEmitter::slnm(const UDSPInstruction opc)
// points into an invalid memory page (ie 0x2000), then AX0.H keeps its old // points into an invalid memory page (ie 0x2000), then AX0.H keeps its old
// value. (not implemented yet) If AR3 points into an invalid memory page, then // value. (not implemented yet) If AR3 points into an invalid memory page, then
// AX0.L gets the same value as AX0.H. (not implemented yet) // AX0.L gets the same value as AX0.H. (not implemented yet)
// LD $axr.h, @$ard
// xxxx xxxx 11dr 0011
void DSPEmitter::ld(const UDSPInstruction opc) void DSPEmitter::ld(const UDSPInstruction opc)
{ {
u8 dreg = (opc >> 5) & 0x1; u8 dreg = (opc >> 5) & 0x1;
@ -329,12 +394,14 @@ void DSPEmitter::ld(const UDSPInstruction opc)
pushExtValueFromMem((dreg << 1) + DSP_REG_AXL0, sreg); pushExtValueFromMem((dreg << 1) + DSP_REG_AXL0, sreg);
// if (IsSameMemArea(g_dsp.r[sreg], g_dsp.r[DSP_REG_AR3])) { // if (IsSameMemArea(g_dsp.r[sreg], g_dsp.r[DSP_REG_AR3])) {
dsp_op_read_reg(sreg, RSI, NONE); X64Reg tmp;
dsp_op_read_reg(DSP_REG_AR3, RDI, NONE); gpr.getFreeXReg(tmp);
SHR(16, R(ESI), Imm8(10)); dsp_op_read_reg(sreg, RCX, NONE);
SHR(16, R(EDI), Imm8(10)); dsp_op_read_reg(DSP_REG_AR3, tmp, NONE);
XOR(16, R(ECX), R(tmp));
gpr.putXReg(tmp);
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
CMP(16, R(ESI), R(EDI)); TEST(16, R(ECX), Imm16(0xfc00));
FixupBranch not_equal = J_CC(CC_NE,true); FixupBranch not_equal = J_CC(CC_NE,true);
pushExtValueFromMem2((rreg << 1) + DSP_REG_AXL1, sreg); pushExtValueFromMem2((rreg << 1) + DSP_REG_AXL1, sreg);
gpr.flushRegs(c); gpr.flushRegs(c);
@ -349,13 +416,15 @@ void DSPEmitter::ld(const UDSPInstruction opc)
} else { } else {
pushExtValueFromMem(rreg + DSP_REG_AXH0, dreg); pushExtValueFromMem(rreg + DSP_REG_AXH0, dreg);
X64Reg tmp;
gpr.getFreeXReg(tmp);
//if (IsSameMemArea(g_dsp.r[dreg], g_dsp.r[DSP_REG_AR3])) { //if (IsSameMemArea(g_dsp.r[dreg], g_dsp.r[DSP_REG_AR3])) {
dsp_op_read_reg(dreg, RSI, NONE); dsp_op_read_reg(dreg, RCX, NONE);
dsp_op_read_reg(DSP_REG_AR3, RDI, NONE); dsp_op_read_reg(DSP_REG_AR3, tmp, NONE);
SHR(16, R(ESI), Imm8(10)); XOR(16, R(ECX), R(tmp));
SHR(16, R(EDI), Imm8(10)); gpr.putXReg(tmp);
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
CMP(16, R(ESI), R(EDI)); TEST(16, R(ECX), Imm16(0xfc00));
FixupBranch not_equal = J_CC(CC_NE, true); FixupBranch not_equal = J_CC(CC_NE, true);
pushExtValueFromMem2(rreg + DSP_REG_AXL0, dreg); pushExtValueFromMem2(rreg + DSP_REG_AXL0, dreg);
gpr.flushRegs(c); gpr.flushRegs(c);
@ -382,13 +451,15 @@ void DSPEmitter::ldn(const UDSPInstruction opc)
if (sreg != DSP_REG_AR3) { if (sreg != DSP_REG_AR3) {
pushExtValueFromMem((dreg << 1) + DSP_REG_AXL0, sreg); pushExtValueFromMem((dreg << 1) + DSP_REG_AXL0, sreg);
X64Reg tmp;
gpr.getFreeXReg(tmp);
//if (IsSameMemArea(g_dsp.r[sreg], g_dsp.r[DSP_REG_AR3])) { //if (IsSameMemArea(g_dsp.r[sreg], g_dsp.r[DSP_REG_AR3])) {
dsp_op_read_reg(sreg, RSI, NONE); dsp_op_read_reg(sreg, RCX, NONE);
dsp_op_read_reg(DSP_REG_AR3, RDI, NONE); dsp_op_read_reg(DSP_REG_AR3, tmp, NONE);
SHR(16, R(ESI), Imm8(10)); XOR(16, R(ECX), R(tmp));
SHR(16, R(EDI), Imm8(10)); gpr.putXReg(tmp);
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
CMP(16, R(ESI), R(EDI)); TEST(16, R(ECX), Imm16(0xfc00));
FixupBranch not_equal = J_CC(CC_NE,true); FixupBranch not_equal = J_CC(CC_NE,true);
pushExtValueFromMem2((rreg << 1) + DSP_REG_AXL1, sreg); pushExtValueFromMem2((rreg << 1) + DSP_REG_AXL1, sreg);
gpr.flushRegs(c); gpr.flushRegs(c);
@ -398,17 +469,19 @@ void DSPEmitter::ldn(const UDSPInstruction opc)
gpr.flushRegs(c); gpr.flushRegs(c);
SetJumpTarget(after); SetJumpTarget(after);
increase_addr_reg(sreg); increase_addr_reg(sreg, sreg);
} else { } else {
pushExtValueFromMem(rreg + DSP_REG_AXH0, dreg); pushExtValueFromMem(rreg + DSP_REG_AXH0, dreg);
X64Reg tmp;
gpr.getFreeXReg(tmp);
//if (IsSameMemArea(g_dsp.r[dreg], g_dsp.r[DSP_REG_AR3])) { //if (IsSameMemArea(g_dsp.r[dreg], g_dsp.r[DSP_REG_AR3])) {
dsp_op_read_reg(dreg, RSI, NONE); dsp_op_read_reg(dreg, RCX, NONE);
dsp_op_read_reg(DSP_REG_AR3, RDI, NONE); dsp_op_read_reg(DSP_REG_AR3, tmp, NONE);
SHR(16, R(ESI), Imm8(10)); XOR(16, R(ECX), R(tmp));
SHR(16, R(EDI), Imm8(10)); gpr.putXReg(tmp);
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
CMP(16, R(ESI), R(EDI)); TEST(16, R(ECX), Imm16(0xfc00));
FixupBranch not_equal = J_CC(CC_NE,true); FixupBranch not_equal = J_CC(CC_NE,true);
pushExtValueFromMem2(rreg + DSP_REG_AXL0, dreg); pushExtValueFromMem2(rreg + DSP_REG_AXL0, dreg);
gpr.flushRegs(c); gpr.flushRegs(c);
@ -418,7 +491,7 @@ void DSPEmitter::ldn(const UDSPInstruction opc)
gpr.flushRegs(c); gpr.flushRegs(c);
SetJumpTarget(after); SetJumpTarget(after);
increase_addr_reg(dreg); increase_addr_reg(dreg, dreg);
} }
increment_addr_reg(DSP_REG_AR3); increment_addr_reg(DSP_REG_AR3);
@ -435,13 +508,15 @@ void DSPEmitter::ldm(const UDSPInstruction opc)
if (sreg != DSP_REG_AR3) { if (sreg != DSP_REG_AR3) {
pushExtValueFromMem((dreg << 1) + DSP_REG_AXL0, sreg); pushExtValueFromMem((dreg << 1) + DSP_REG_AXL0, sreg);
X64Reg tmp;
gpr.getFreeXReg(tmp);
//if (IsSameMemArea(g_dsp.r[sreg], g_dsp.r[DSP_REG_AR3])) { //if (IsSameMemArea(g_dsp.r[sreg], g_dsp.r[DSP_REG_AR3])) {
dsp_op_read_reg(sreg, RSI, NONE); dsp_op_read_reg(sreg, RCX, NONE);
dsp_op_read_reg(DSP_REG_AR3, RDI, NONE); dsp_op_read_reg(DSP_REG_AR3, tmp, NONE);
SHR(16, R(ESI), Imm8(10)); XOR(16, R(ECX), R(tmp));
SHR(16, R(EDI), Imm8(10)); gpr.putXReg(tmp);
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
CMP(16, R(ESI), R(EDI)); TEST(16, R(ECX), Imm16(0xfc00));
FixupBranch not_equal = J_CC(CC_NE,true); FixupBranch not_equal = J_CC(CC_NE,true);
pushExtValueFromMem2((rreg << 1) + DSP_REG_AXL1, sreg); pushExtValueFromMem2((rreg << 1) + DSP_REG_AXL1, sreg);
gpr.flushRegs(c); gpr.flushRegs(c);
@ -455,13 +530,15 @@ void DSPEmitter::ldm(const UDSPInstruction opc)
} else { } else {
pushExtValueFromMem(rreg + DSP_REG_AXH0, dreg); pushExtValueFromMem(rreg + DSP_REG_AXH0, dreg);
X64Reg tmp;
gpr.getFreeXReg(tmp);
//if (IsSameMemArea(g_dsp.r[dreg], g_dsp.r[DSP_REG_AR3])) { //if (IsSameMemArea(g_dsp.r[dreg], g_dsp.r[DSP_REG_AR3])) {
dsp_op_read_reg(dreg, RSI, NONE); dsp_op_read_reg(dreg, RCX, NONE);
dsp_op_read_reg(DSP_REG_AR3, RDI, NONE); dsp_op_read_reg(DSP_REG_AR3, tmp, NONE);
SHR(16, R(ESI), Imm8(10)); XOR(16, R(ECX), R(tmp));
SHR(16, R(EDI), Imm8(10)); gpr.putXReg(tmp);
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
CMP(16, R(ESI), R(EDI)); TEST(16, R(ECX), Imm16(0xfc00));
FixupBranch not_equal = J_CC(CC_NE,true); FixupBranch not_equal = J_CC(CC_NE,true);
pushExtValueFromMem2(rreg + DSP_REG_AXL0, dreg); pushExtValueFromMem2(rreg + DSP_REG_AXL0, dreg);
gpr.flushRegs(c); gpr.flushRegs(c);
@ -474,7 +551,7 @@ void DSPEmitter::ldm(const UDSPInstruction opc)
increment_addr_reg(dreg); increment_addr_reg(dreg);
} }
increase_addr_reg(DSP_REG_AR3); increase_addr_reg(DSP_REG_AR3, DSP_REG_AR3);
} }
// LDNM $ax0.d, $ax1.r, @$arS // LDNM $ax0.d, $ax1.r, @$arS
@ -488,13 +565,15 @@ void DSPEmitter::ldnm(const UDSPInstruction opc)
if (sreg != DSP_REG_AR3) { if (sreg != DSP_REG_AR3) {
pushExtValueFromMem((dreg << 1) + DSP_REG_AXL0, sreg); pushExtValueFromMem((dreg << 1) + DSP_REG_AXL0, sreg);
X64Reg tmp;
gpr.getFreeXReg(tmp);
//if (IsSameMemArea(g_dsp.r[sreg], g_dsp.r[DSP_REG_AR3])) { //if (IsSameMemArea(g_dsp.r[sreg], g_dsp.r[DSP_REG_AR3])) {
dsp_op_read_reg(sreg, RSI, NONE); dsp_op_read_reg(sreg, RCX, NONE);
dsp_op_read_reg(DSP_REG_AR3, RDI, NONE); dsp_op_read_reg(DSP_REG_AR3, tmp, NONE);
SHR(16, R(ESI), Imm8(10)); XOR(16, R(ECX), R(tmp));
SHR(16, R(EDI), Imm8(10)); gpr.putXReg(tmp);
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
CMP(16, R(ESI), R(EDI)); TEST(16, R(ECX), Imm16(0xfc00));
FixupBranch not_equal = J_CC(CC_NE,true); FixupBranch not_equal = J_CC(CC_NE,true);
pushExtValueFromMem2((rreg << 1) + DSP_REG_AXL1, sreg); pushExtValueFromMem2((rreg << 1) + DSP_REG_AXL1, sreg);
gpr.flushRegs(c); gpr.flushRegs(c);
@ -504,17 +583,19 @@ void DSPEmitter::ldnm(const UDSPInstruction opc)
gpr.flushRegs(c); gpr.flushRegs(c);
SetJumpTarget(after); SetJumpTarget(after);
increase_addr_reg(sreg); increase_addr_reg(sreg, sreg);
} else { } else {
pushExtValueFromMem(rreg + DSP_REG_AXH0, dreg); pushExtValueFromMem(rreg + DSP_REG_AXH0, dreg);
X64Reg tmp;
gpr.getFreeXReg(tmp);
//if (IsSameMemArea(g_dsp.r[dreg], g_dsp.r[DSP_REG_AR3])) { //if (IsSameMemArea(g_dsp.r[dreg], g_dsp.r[DSP_REG_AR3])) {
dsp_op_read_reg(dreg, RSI, NONE); dsp_op_read_reg(dreg, RCX, NONE);
dsp_op_read_reg(DSP_REG_AR3, RDI, NONE); dsp_op_read_reg(DSP_REG_AR3, tmp, NONE);
SHR(16, R(ESI), Imm8(10)); XOR(16, R(ECX), R(tmp));
SHR(16, R(EDI), Imm8(10)); gpr.putXReg(tmp);
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
CMP(16, R(ESI), R(EDI)); TEST(16, R(ECX), Imm16(0xfc00));
FixupBranch not_equal = J_CC(CC_NE,true); FixupBranch not_equal = J_CC(CC_NE,true);
pushExtValueFromMem2(rreg + DSP_REG_AXL0, dreg); pushExtValueFromMem2(rreg + DSP_REG_AXL0, dreg);
gpr.flushRegs(c); gpr.flushRegs(c);
@ -524,10 +605,10 @@ void DSPEmitter::ldnm(const UDSPInstruction opc)
gpr.flushRegs(c); gpr.flushRegs(c);
SetJumpTarget(after); SetJumpTarget(after);
increase_addr_reg(dreg); increase_addr_reg(dreg, dreg);
} }
increase_addr_reg(DSP_REG_AR3); increase_addr_reg(DSP_REG_AR3, DSP_REG_AR3);
} }
@ -540,8 +621,15 @@ void DSPEmitter::pushExtValueFromReg(u16 dreg, u16 sreg) {
void DSPEmitter::pushExtValueFromMem(u16 dreg, u16 sreg) { void DSPEmitter::pushExtValueFromMem(u16 dreg, u16 sreg) {
// u16 addr = g_dsp.r[addr]; // u16 addr = g_dsp.r[addr];
dsp_op_read_reg(sreg, RCX, ZERO);
dmem_read(); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1, ZERO);
dmem_read(tmp1);
gpr.putXReg(tmp1);
MOVZX(32, 16, EBX, R(EAX)); MOVZX(32, 16, EBX, R(EAX));
storeIndex = dreg; storeIndex = dreg;
@ -549,8 +637,15 @@ void DSPEmitter::pushExtValueFromMem(u16 dreg, u16 sreg) {
void DSPEmitter::pushExtValueFromMem2(u16 dreg, u16 sreg) { void DSPEmitter::pushExtValueFromMem2(u16 dreg, u16 sreg) {
// u16 addr = g_dsp.r[addr]; // u16 addr = g_dsp.r[addr];
dsp_op_read_reg(sreg, RCX, ZERO);
dmem_read(); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1, ZERO);
dmem_read(tmp1);
gpr.putXReg(tmp1);
SHL(32, R(EAX), Imm8(16)); SHL(32, R(EAX), Imm8(16));
OR(32, R(EBX), R(EAX)); OR(32, R(EBX), R(EAX));
@ -569,7 +664,7 @@ void DSPEmitter::popExtValueToReg() {
dsp_op_write_reg(storeIndex, RBX); dsp_op_write_reg(storeIndex, RBX);
if (storeIndex >= DSP_REG_ACM0 && storeIndex2 == -1) { if (storeIndex >= DSP_REG_ACM0 && storeIndex2 == -1) {
TEST(32, R(EBX), Imm32(SR_40_MODE_BIT << 16)); TEST(32, R(EBX), Imm32(SR_40_MODE_BIT << 16));
FixupBranch not_40bit = J_CC(CC_Z); FixupBranch not_40bit = J_CC(CC_Z, true);
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
//if (g_dsp.r[DSP_REG_SR] & SR_40_MODE_BIT) //if (g_dsp.r[DSP_REG_SR] & SR_40_MODE_BIT)
//{ //{
@ -613,16 +708,16 @@ void DSPEmitter::zeroWriteBackLog(const UDSPInstruction opc)
if ((opc >> 12) == 0x3) { if ((opc >> 12) == 0x3) {
if (! extOpTable[opc & 0x7F]->jitFunc) if (! extOpTable[opc & 0x7F]->jitFunc)
{ {
SaveDSPRegs(); gpr.pushRegs();
ABI_CallFunction((void*)::zeroWriteBackLog); ABI_CallFunction((void*)::zeroWriteBackLog);
LoadDSPRegs(); gpr.popRegs();
} }
} else { } else {
if (! extOpTable[opc & 0xFF]->jitFunc) if (! extOpTable[opc & 0xFF]->jitFunc)
{ {
SaveDSPRegs(); gpr.pushRegs();
ABI_CallFunction((void*)::zeroWriteBackLog); ABI_CallFunction((void*)::zeroWriteBackLog);
LoadDSPRegs(); gpr.popRegs();
} }
} }
return; return;

View File

@ -35,11 +35,18 @@ void DSPEmitter::srs(const UDSPInstruction opc)
{ {
u8 reg = ((opc >> 8) & 0x7) + 0x18; u8 reg = ((opc >> 8) & 0x7) + 0x18;
//u16 addr = (g_dsp.r.cr << 8) | (opc & 0xFF); //u16 addr = (g_dsp.r.cr << 8) | (opc & 0xFF);
dsp_op_read_reg(reg, RCX, ZERO);
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
dsp_op_read_reg(reg, tmp1, ZERO);
dsp_op_read_reg(DSP_REG_CR, RAX, ZERO); dsp_op_read_reg(DSP_REG_CR, RAX, ZERO);
SHL(16, R(EAX), Imm8(8)); SHL(16, R(EAX), Imm8(8));
OR(8, R(EAX), Imm8(opc & 0xFF)); OR(16, R(EAX), Imm16(opc & 0xFF));
dmem_write(); dmem_write(tmp1);
gpr.putXReg(tmp1);
} }
// LRS $(0x18+D), @M // LRS $(0x18+D), @M
@ -50,11 +57,18 @@ void DSPEmitter::srs(const UDSPInstruction opc)
void DSPEmitter::lrs(const UDSPInstruction opc) void DSPEmitter::lrs(const UDSPInstruction opc)
{ {
u8 reg = ((opc >> 8) & 0x7) + 0x18; u8 reg = ((opc >> 8) & 0x7) + 0x18;
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
//u16 addr = (g_dsp.r[DSP_REG_CR] << 8) | (opc & 0xFF); //u16 addr = (g_dsp.r[DSP_REG_CR] << 8) | (opc & 0xFF);
dsp_op_read_reg(DSP_REG_CR, RCX, ZERO); dsp_op_read_reg(DSP_REG_CR, tmp1, ZERO);
SHL(16, R(ECX), Imm8(8)); SHL(16, R(tmp1), Imm8(8));
OR(8, R(ECX), Imm8(opc & 0xFF)); OR(16, R(tmp1), Imm16(opc & 0xFF));
dmem_read(); dmem_read(tmp1);
gpr.putXReg(tmp1);
dsp_op_write_reg(reg, RAX); dsp_op_write_reg(reg, RAX);
dsp_conditional_extend_accum(reg); dsp_conditional_extend_accum(reg);
} }
@ -82,8 +96,14 @@ void DSPEmitter::sr(const UDSPInstruction opc)
{ {
u8 reg = opc & DSP_REG_MASK; u8 reg = opc & DSP_REG_MASK;
u16 address = dsp_imem_read(compilePC + 1); u16 address = dsp_imem_read(compilePC + 1);
dsp_op_read_reg(reg, ECX);
dmem_write_imm(address); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
dsp_op_read_reg(reg, tmp1);
dmem_write_imm(address, tmp1);
gpr.putXReg(tmp1);
} }
// SI @M, #I // SI @M, #I
@ -95,8 +115,14 @@ void DSPEmitter::si(const UDSPInstruction opc)
{ {
u16 address = (s8)opc; u16 address = (s8)opc;
u16 imm = dsp_imem_read(compilePC + 1); u16 imm = dsp_imem_read(compilePC + 1);
MOV(32, R(ECX), Imm32((u32)imm));
dmem_write_imm(address); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
MOV(32, R(tmp1), Imm32((u32)imm));
dmem_write_imm(address, tmp1);
gpr.putXReg(tmp1);
} }
// LRR $D, @$S // LRR $D, @$S
@ -108,8 +134,14 @@ void DSPEmitter::lrr(const UDSPInstruction opc)
u8 sreg = (opc >> 5) & 0x3; u8 sreg = (opc >> 5) & 0x3;
u8 dreg = opc & 0x1f; u8 dreg = opc & 0x1f;
dsp_op_read_reg(sreg, ECX); X64Reg tmp1;
dmem_read(); gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1);
dmem_read(tmp1);
gpr.putXReg(tmp1);
dsp_op_write_reg(dreg, EAX); dsp_op_write_reg(dreg, EAX);
dsp_conditional_extend_accum(dreg); dsp_conditional_extend_accum(dreg);
} }
@ -124,8 +156,14 @@ void DSPEmitter::lrrd(const UDSPInstruction opc)
u8 sreg = (opc >> 5) & 0x3; u8 sreg = (opc >> 5) & 0x3;
u8 dreg = opc & 0x1f; u8 dreg = opc & 0x1f;
dsp_op_read_reg(sreg, ECX); X64Reg tmp1;
dmem_read(); gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1);
dmem_read(tmp1);
gpr.putXReg(tmp1);
dsp_op_write_reg(dreg, EAX); dsp_op_write_reg(dreg, EAX);
dsp_conditional_extend_accum(dreg); dsp_conditional_extend_accum(dreg);
decrement_addr_reg(sreg); decrement_addr_reg(sreg);
@ -141,8 +179,14 @@ void DSPEmitter::lrri(const UDSPInstruction opc)
u8 sreg = (opc >> 5) & 0x3; u8 sreg = (opc >> 5) & 0x3;
u8 dreg = opc & 0x1f; u8 dreg = opc & 0x1f;
dsp_op_read_reg(sreg, ECX); X64Reg tmp1;
dmem_read(); gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1);
dmem_read(tmp1);
gpr.putXReg(tmp1);
dsp_op_write_reg(dreg, EAX); dsp_op_write_reg(dreg, EAX);
dsp_conditional_extend_accum(dreg); dsp_conditional_extend_accum(dreg);
increment_addr_reg(sreg); increment_addr_reg(sreg);
@ -158,11 +202,17 @@ void DSPEmitter::lrrn(const UDSPInstruction opc)
u8 sreg = (opc >> 5) & 0x3; u8 sreg = (opc >> 5) & 0x3;
u8 dreg = opc & 0x1f; u8 dreg = opc & 0x1f;
dsp_op_read_reg(sreg, ECX); X64Reg tmp1;
dmem_read(); gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1);
dmem_read(tmp1);
gpr.putXReg(tmp1);
dsp_op_write_reg(dreg, EAX); dsp_op_write_reg(dreg, EAX);
dsp_conditional_extend_accum(dreg); dsp_conditional_extend_accum(dreg);
increase_addr_reg(sreg); increase_addr_reg(sreg, sreg);
} }
// SRR @$D, $S // SRR @$D, $S
@ -175,9 +225,14 @@ void DSPEmitter::srr(const UDSPInstruction opc)
u8 dreg = (opc >> 5) & 0x3; u8 dreg = (opc >> 5) & 0x3;
u8 sreg = opc & 0x1f; u8 sreg = opc & 0x1f;
dsp_op_read_reg(sreg, ECX); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1);
dsp_op_read_reg(dreg, RAX, ZERO); dsp_op_read_reg(dreg, RAX, ZERO);
dmem_write(); dmem_write(tmp1);
gpr.putXReg(tmp1);
} }
// SRRD @$D, $S // SRRD @$D, $S
@ -190,9 +245,15 @@ void DSPEmitter::srrd(const UDSPInstruction opc)
u8 dreg = (opc >> 5) & 0x3; u8 dreg = (opc >> 5) & 0x3;
u8 sreg = opc & 0x1f; u8 sreg = opc & 0x1f;
dsp_op_read_reg(sreg, ECX); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1);
dsp_op_read_reg(dreg, RAX, ZERO); dsp_op_read_reg(dreg, RAX, ZERO);
dmem_write(); dmem_write(tmp1);
gpr.putXReg(tmp1);
decrement_addr_reg(dreg); decrement_addr_reg(dreg);
} }
@ -206,9 +267,15 @@ void DSPEmitter::srri(const UDSPInstruction opc)
u8 dreg = (opc >> 5) & 0x3; u8 dreg = (opc >> 5) & 0x3;
u8 sreg = opc & 0x1f; u8 sreg = opc & 0x1f;
dsp_op_read_reg(sreg, ECX); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1);
dsp_op_read_reg(dreg, RAX, ZERO); dsp_op_read_reg(dreg, RAX, ZERO);
dmem_write(); dmem_write(tmp1);
gpr.putXReg(tmp1);
increment_addr_reg(dreg); increment_addr_reg(dreg);
} }
@ -222,10 +289,16 @@ void DSPEmitter::srrn(const UDSPInstruction opc)
u8 dreg = (opc >> 5) & 0x3; u8 dreg = (opc >> 5) & 0x3;
u8 sreg = opc & 0x1f; u8 sreg = opc & 0x1f;
dsp_op_read_reg(sreg, ECX); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
dsp_op_read_reg(sreg, tmp1);
dsp_op_read_reg(dreg, RAX, ZERO); dsp_op_read_reg(dreg, RAX, ZERO);
dmem_write(); dmem_write(tmp1);
increase_addr_reg(dreg);
gpr.putXReg(tmp1);
increase_addr_reg(dreg, dreg);
} }
// ILRR $acD.m, @$arS // ILRR $acD.m, @$arS
@ -237,8 +310,14 @@ void DSPEmitter::ilrr(const UDSPInstruction opc)
u16 reg = opc & 0x3; u16 reg = opc & 0x3;
u16 dreg = (opc >> 8) & 1; u16 dreg = (opc >> 8) & 1;
dsp_op_read_reg(reg, RCX, ZERO); X64Reg tmp1;
imem_read(); gpr.getFreeXReg(tmp1);
dsp_op_read_reg(reg, tmp1, ZERO);
imem_read(tmp1);
gpr.putXReg(tmp1);
set_acc_m(dreg, R(RAX)); set_acc_m(dreg, R(RAX));
dsp_conditional_extend_accum(dreg); dsp_conditional_extend_accum(dreg);
} }
@ -252,8 +331,14 @@ void DSPEmitter::ilrrd(const UDSPInstruction opc)
u16 reg = opc & 0x3; u16 reg = opc & 0x3;
u16 dreg = (opc >> 8) & 1; u16 dreg = (opc >> 8) & 1;
dsp_op_read_reg(reg, RCX, ZERO); X64Reg tmp1;
imem_read(); gpr.getFreeXReg(tmp1);
dsp_op_read_reg(reg, tmp1, ZERO);
imem_read(tmp1);
gpr.putXReg(tmp1);
set_acc_m(dreg, R(RAX)); set_acc_m(dreg, R(RAX));
dsp_conditional_extend_accum(dreg); dsp_conditional_extend_accum(dreg);
decrement_addr_reg(reg); decrement_addr_reg(reg);
@ -268,8 +353,14 @@ void DSPEmitter::ilrri(const UDSPInstruction opc)
u16 reg = opc & 0x3; u16 reg = opc & 0x3;
u16 dreg = (opc >> 8) & 1; u16 dreg = (opc >> 8) & 1;
dsp_op_read_reg(reg, RCX, ZERO); X64Reg tmp1;
imem_read(); gpr.getFreeXReg(tmp1);
dsp_op_read_reg(reg, tmp1, ZERO);
imem_read(tmp1);
gpr.putXReg(tmp1);
set_acc_m(dreg, R(RAX)); set_acc_m(dreg, R(RAX));
dsp_conditional_extend_accum(dreg); dsp_conditional_extend_accum(dreg);
increment_addr_reg(reg); increment_addr_reg(reg);
@ -285,10 +376,16 @@ void DSPEmitter::ilrrn(const UDSPInstruction opc)
u16 reg = opc & 0x3; u16 reg = opc & 0x3;
u16 dreg = (opc >> 8) & 1; u16 dreg = (opc >> 8) & 1;
dsp_op_read_reg(reg, RCX, ZERO); X64Reg tmp1;
imem_read(); gpr.getFreeXReg(tmp1);
dsp_op_read_reg(reg, tmp1, ZERO);
imem_read(tmp1);
gpr.putXReg(tmp1);
set_acc_m(dreg, R(RAX)); set_acc_m(dreg, R(RAX));
dsp_conditional_extend_accum(dreg); dsp_conditional_extend_accum(dreg);
increase_addr_reg(reg); increase_addr_reg(reg, reg);
} }

View File

@ -25,7 +25,7 @@ using namespace Gen;
//clobbers: //clobbers:
//EAX = (s8)g_dsp.reg_stack_ptr[stack_reg] //EAX = (s8)g_dsp.reg_stack_ptr[stack_reg]
//CX = g_dsp.reg_stack[stack_reg][g_dsp.reg_stack_ptr[stack_reg]] //expects:
void DSPEmitter::dsp_reg_stack_push(int stack_reg) void DSPEmitter::dsp_reg_stack_push(int stack_reg)
{ {
//g_dsp.reg_stack_ptr[stack_reg]++; //g_dsp.reg_stack_ptr[stack_reg]++;
@ -35,30 +35,38 @@ void DSPEmitter::dsp_reg_stack_push(int stack_reg)
AND(8, R(AL), Imm8(DSP_STACK_MASK)); AND(8, R(AL), Imm8(DSP_STACK_MASK));
MOV(8, M(&g_dsp.reg_stack_ptr[stack_reg]), R(AL)); MOV(8, M(&g_dsp.reg_stack_ptr[stack_reg]), R(AL));
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
//g_dsp.reg_stack[stack_reg][g_dsp.reg_stack_ptr[stack_reg]] = g_dsp.r[DSP_REG_ST0 + stack_reg]; //g_dsp.reg_stack[stack_reg][g_dsp.reg_stack_ptr[stack_reg]] = g_dsp.r[DSP_REG_ST0 + stack_reg];
MOV(16, R(CX), M(&g_dsp.r.st[stack_reg])); MOV(16, R(tmp1), M(&g_dsp.r.st[stack_reg]));
#ifdef _M_IX86 // All32 #ifdef _M_IX86 // All32
MOVZX(32, 8, EAX, R(AL)); MOVZX(32, 8, EAX, R(AL));
#else #else
MOVZX(64, 8, RAX, R(AL)); MOVZX(64, 8, RAX, R(AL));
#endif #endif
MOV(16, MComplex(EAX, EAX, 1, (u64)&g_dsp.reg_stack[stack_reg][0]), R(CX)); MOV(16, MComplex(EAX, EAX, 1,
PtrOffset(&g_dsp.reg_stack[stack_reg][0],0)), R(tmp1));
gpr.putXReg(tmp1);
} }
//clobbers: //clobbers:
//EAX = (s8)g_dsp.reg_stack_ptr[stack_reg] //EAX = (s8)g_dsp.reg_stack_ptr[stack_reg]
//CX = g_dsp.reg_stack[stack_reg][g_dsp.reg_stack_ptr[stack_reg]] //expects:
void DSPEmitter::dsp_reg_stack_pop(int stack_reg) void DSPEmitter::dsp_reg_stack_pop(int stack_reg)
{ {
//g_dsp.r[DSP_REG_ST0 + stack_reg] = g_dsp.reg_stack[stack_reg][g_dsp.reg_stack_ptr[stack_reg]]; //g_dsp.r[DSP_REG_ST0 + stack_reg] = g_dsp.reg_stack[stack_reg][g_dsp.reg_stack_ptr[stack_reg]];
MOV(8, R(AL), M(&g_dsp.reg_stack_ptr[stack_reg])); MOV(8, R(AL), M(&g_dsp.reg_stack_ptr[stack_reg]));
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
#ifdef _M_IX86 // All32 #ifdef _M_IX86 // All32
MOVZX(32, 8, EAX, R(AL)); MOVZX(32, 8, EAX, R(AL));
#else #else
MOVZX(64, 8, RAX, R(AL)); MOVZX(64, 8, RAX, R(AL));
#endif #endif
MOV(16, R(CX), MComplex(EAX, EAX, 1, (u64)&g_dsp.reg_stack[stack_reg][0])); MOV(16, R(tmp1), MComplex(EAX, EAX, 1,
MOV(16, M(&g_dsp.r.st[stack_reg]), R(CX)); PtrOffset(&g_dsp.reg_stack[stack_reg][0],0)));
MOV(16, M(&g_dsp.r.st[stack_reg]), R(tmp1));
gpr.putXReg(tmp1);
//g_dsp.reg_stack_ptr[stack_reg]--; //g_dsp.reg_stack_ptr[stack_reg]--;
//g_dsp.reg_stack_ptr[stack_reg] &= DSP_STACK_MASK; //g_dsp.reg_stack_ptr[stack_reg] &= DSP_STACK_MASK;
@ -165,7 +173,7 @@ void DSPEmitter::dsp_conditional_extend_accum(int reg)
//} //}
gpr.flushRegs(c); gpr.flushRegs(c);
SetJumpTarget(not_40bit); SetJumpTarget(not_40bit);
gpr.putReg(DSP_REG_SR); gpr.putReg(DSP_REG_SR, false);
} }
} }
} }
@ -181,7 +189,7 @@ void DSPEmitter::dsp_conditional_extend_accum_imm(int reg, u16 val)
gpr.getReg(DSP_REG_SR,sr_reg); gpr.getReg(DSP_REG_SR,sr_reg);
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
TEST(16, sr_reg, Imm16(SR_40_MODE_BIT)); TEST(16, sr_reg, Imm16(SR_40_MODE_BIT));
FixupBranch not_40bit = J_CC(CC_Z); FixupBranch not_40bit = J_CC(CC_Z, true);
//if (g_dsp.r[DSP_REG_SR] & SR_40_MODE_BIT) //if (g_dsp.r[DSP_REG_SR] & SR_40_MODE_BIT)
//{ //{
// Sign extend into whole accum. // Sign extend into whole accum.
@ -192,7 +200,7 @@ void DSPEmitter::dsp_conditional_extend_accum_imm(int reg, u16 val)
//} //}
gpr.flushRegs(c); gpr.flushRegs(c);
SetJumpTarget(not_40bit); SetJumpTarget(not_40bit);
gpr.putReg(DSP_REG_SR); gpr.putReg(DSP_REG_SR, false);
} }
} }
} }
@ -327,9 +335,9 @@ void DSPEmitter::addarn(const UDSPInstruction opc)
// u8 dreg = opc & 0x3; // u8 dreg = opc & 0x3;
// u8 sreg = (opc >> 2) & 0x3; // u8 sreg = (opc >> 2) & 0x3;
// g_dsp.r[dreg] = dsp_increase_addr_reg(dreg, (s16)g_dsp.r[DSP_REG_IX0 + sreg]); // g_dsp.r[dreg] = dsp_increase_addr_reg(dreg, (s16)g_dsp.r[DSP_REG_IX0 + sreg]);
// From looking around it is always called with the matching index register // From looking around it is always called with the matching index register
increase_addr_reg(opc & 0x3); increase_addr_reg(opc & 0x3, (opc >> 2) & 0x3);
} }
//---- //----

View File

@ -31,13 +31,12 @@
using namespace Gen; using namespace Gen;
// Returns s64 in RAX // Returns s64 in RAX
// In: RSI = s16 a, RDI = s16 b // In: RCX = s16 a, RAX = s16 b
void DSPEmitter::multiply() void DSPEmitter::multiply()
{ {
#ifdef _M_X64 #ifdef _M_X64
// prod = (s16)a * (s16)b; //signed // prod = (s16)a * (s16)b; //signed
MOV(64, R(EAX), R(RDI)); IMUL(64, R(ECX));
IMUL(64, R(ESI));
// Conditionally multiply by 2. // Conditionally multiply by 2.
// if ((g_dsp.r.sr & SR_MUL_MODIFY) == 0) // if ((g_dsp.r.sr & SR_MUL_MODIFY) == 0)
@ -46,9 +45,9 @@ void DSPEmitter::multiply()
TEST(16, sr_reg, Imm16(SR_MUL_MODIFY)); TEST(16, sr_reg, Imm16(SR_MUL_MODIFY));
FixupBranch noMult2 = J_CC(CC_NZ); FixupBranch noMult2 = J_CC(CC_NZ);
// prod <<= 1; // prod <<= 1;
SHL(64, R(EAX), Imm8(1)); LEA(64, RAX, MRegSum(RAX,RAX));
SetJumpTarget(noMult2); SetJumpTarget(noMult2);
gpr.putReg(DSP_REG_SR); gpr.putReg(DSP_REG_SR, false);
// return prod; // return prod;
#endif #endif
} }
@ -60,7 +59,7 @@ void DSPEmitter::multiply_add()
// s64 prod = dsp_get_long_prod() + dsp_get_multiply_prod(a, b, sign); // s64 prod = dsp_get_long_prod() + dsp_get_multiply_prod(a, b, sign);
multiply(); multiply();
MOV(64, R(RDX), R(RAX)); MOV(64, R(RDX), R(RAX));
get_long_prod(); get_long_prod();
ADD(64, R(RAX), R(RDX)); ADD(64, R(RAX), R(RDX));
// return prod; // return prod;
} }
@ -72,14 +71,14 @@ void DSPEmitter::multiply_sub()
// s64 prod = dsp_get_long_prod() - dsp_get_multiply_prod(a, b, sign); // s64 prod = dsp_get_long_prod() - dsp_get_multiply_prod(a, b, sign);
multiply(); multiply();
MOV(64, R(RDX), R(RAX)); MOV(64, R(RDX), R(RAX));
get_long_prod(); get_long_prod();
SUB(64, R(RAX), R(RDX)); SUB(64, R(RAX), R(RDX));
// return prod; // return prod;
} }
// Only MULX family instructions have unsigned/mixed support. // Only MULX family instructions have unsigned/mixed support.
// Returns s64 in EAX // Returns s64 in EAX
// In: RSI = s16 a, RDI = s16 b // In: RCX = s16 a, RAX = s16 b
// Returns s64 in RAX // Returns s64 in RAX
void DSPEmitter::multiply_mulx(u8 axh0, u8 axh1) void DSPEmitter::multiply_mulx(u8 axh0, u8 axh1)
{ {
@ -101,41 +100,48 @@ void DSPEmitter::multiply_mulx(u8 axh0, u8 axh1)
TEST(16, sr_reg, Imm16(SR_MUL_UNSIGNED)); TEST(16, sr_reg, Imm16(SR_MUL_UNSIGNED));
FixupBranch unsignedMul = J_CC(CC_NZ); FixupBranch unsignedMul = J_CC(CC_NZ);
// prod = (s16)a * (s16)b; //signed // prod = (s16)a * (s16)b; //signed
MOVSX(64, 16, RAX, R(RDI)); MOVSX(64, 16, RAX, R(RAX));
IMUL(64, R(RSI)); IMUL(64, R(RCX));
FixupBranch signedMul = J(); FixupBranch signedMul = J(true);
SetJumpTarget(unsignedMul); SetJumpTarget(unsignedMul);
DSPJitRegCache c(gpr);
gpr.putReg(DSP_REG_SR, false);
if ((axh0==0) && (axh1==0)) if ((axh0==0) && (axh1==0))
{ {
// unsigned support ON if both ax?.l regs are used // unsigned support ON if both ax?.l regs are used
// prod = (u32)(a * b); // prod = (u32)(a * b);
MOVZX(64, 16, RSI, R(RSI)); MOVZX(64, 16, RCX, R(RCX));
MOVZX(64, 16, RAX, R(RDI)); MOVZX(64, 16, RAX, R(RAX));
MUL(64, R(RSI)); MUL(64, R(RCX));
} }
else if ((axh0==0) && (axh1==1)) else if ((axh0==0) && (axh1==1))
{ {
// mixed support ON (u16)axl.0 * (s16)axh.1 // mixed support ON (u16)axl.0 * (s16)axh.1
// prod = a * (s16)b; // prod = a * (s16)b;
MOVZX(64, 16, RAX, R(RSI)); X64Reg tmp;
IMUL(64, R(RDI)); gpr.getFreeXReg(tmp);
MOV(64, R(tmp), R(RAX));
MOVZX(64, 16, RAX, R(RCX));
IMUL(64, R(tmp));
gpr.putXReg(tmp);
} }
else if ((axh0==1) && (axh1==0)) else if ((axh0==1) && (axh1==0))
{ {
// mixed support ON (u16)axl.1 * (s16)axh.0 // mixed support ON (u16)axl.1 * (s16)axh.0
// prod = (s16)a * b; // prod = (s16)a * b;
MOVZX(64, 16, RAX, R(RDI)); MOVZX(64, 16, RAX, R(RAX));
IMUL(64, R(RSI)); IMUL(64, R(RCX));
} }
else else
{ {
// unsigned support OFF if both ax?.h regs are used // unsigned support OFF if both ax?.h regs are used
// prod = (s16)a * (s16)b; //signed // prod = (s16)a * (s16)b; //signed
MOVSX(64, 16, RAX, R(RDI)); MOVSX(64, 16, RAX, R(RAX));
IMUL(64, R(RSI)); IMUL(64, R(RCX));
} }
gpr.flushRegs(c);
SetJumpTarget(signedMul); SetJumpTarget(signedMul);
// Conditionally multiply by 2. // Conditionally multiply by 2.
@ -143,9 +149,9 @@ void DSPEmitter::multiply_mulx(u8 axh0, u8 axh1)
TEST(16, sr_reg, Imm16(SR_MUL_MODIFY)); TEST(16, sr_reg, Imm16(SR_MUL_MODIFY));
FixupBranch noMult2 = J_CC(CC_NZ); FixupBranch noMult2 = J_CC(CC_NZ);
// prod <<= 1; // prod <<= 1;
SHL(64, R(RAX), Imm8(1)); LEA(64, RAX, MRegSum(RAX,RAX));
SetJumpTarget(noMult2); SetJumpTarget(noMult2);
gpr.putReg(DSP_REG_SR); gpr.putReg(DSP_REG_SR, false);
// return prod; // return prod;
} }
@ -169,7 +175,7 @@ void DSPEmitter::clrp(const UDSPInstruction opc)
// g_dsp.r[DSP_REG_PRODM2] = 0x0010; // g_dsp.r[DSP_REG_PRODM2] = 0x0010;
//64bit move to memory does not work. use 2 32bits //64bit move to memory does not work. use 2 32bits
MOV(32, M(&g_dsp.r.prod.val), Imm32(0xfff00000U)); MOV(32, M(&g_dsp.r.prod.val), Imm32(0xfff00000U));
MOV(32, M((u8*)(&g_dsp.r.prod.val)+4), Imm32(0x001000ffU)); MOV(32, M(&g_dsp.r.prod.val+4), Imm32(0x001000ffU));
#else #else
Default(opc); Default(opc);
#endif #endif
@ -285,14 +291,16 @@ void DSPEmitter::addpaxz(const UDSPInstruction opc)
u8 sreg = (opc >> 9) & 0x1; u8 sreg = (opc >> 9) & 0x1;
// s64 ax = dsp_get_long_acx(sreg); // s64 ax = dsp_get_long_acx(sreg);
get_long_acx(sreg, RCX); X64Reg tmp1;
MOV(64, R(RDI), R(RCX)); gpr.getFreeXReg(tmp1);
get_long_acx(sreg, tmp1);
MOV(64, R(RDX), R(tmp1));
// s64 res = prod + (ax & ~0xffff); // s64 res = prod + (ax & ~0xffff);
MOV(64, R(RDX), Imm64(~0xffff)); MOV(64, R(RAX), Imm64(~0xffff));
AND(64, R(RDI), R(RDX)); AND(64, R(RDX), R(RAX));
// s64 prod = dsp_get_long_prod_round_prodl(); // s64 prod = dsp_get_long_prod_round_prodl();
get_long_prod_round_prodl(); get_long_prod_round_prodl();
ADD(64, R(RAX), R(RDI)); ADD(64, R(RAX), R(RDX));
// s64 oldprod = dsp_get_long_prod(); // s64 oldprod = dsp_get_long_prod();
// dsp_set_long_acc(dreg, res); // dsp_set_long_acc(dreg, res);
@ -301,14 +309,15 @@ void DSPEmitter::addpaxz(const UDSPInstruction opc)
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
get_long_prod(RDX); get_long_prod(RDX);
MOV(64, R(RSI), R(RAX)); MOV(64, R(RCX), R(RAX));
set_long_acc(dreg, RSI); set_long_acc(dreg, RCX);
Update_SR_Register64_Carry(); Update_SR_Register64_Carry(EAX, tmp1);
} }
else else
{ {
set_long_acc(dreg, RAX); set_long_acc(dreg, RAX);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -323,8 +332,8 @@ void DSPEmitter::mulaxh(const UDSPInstruction opc)
{ {
#ifdef _M_X64 #ifdef _M_X64
// s64 prod = dsp_multiply(dsp_get_ax_h(0), dsp_get_ax_h(0)); // s64 prod = dsp_multiply(dsp_get_ax_h(0), dsp_get_ax_h(0));
dsp_op_read_reg(DSP_REG_AXH0, RSI, SIGN); dsp_op_read_reg(DSP_REG_AXH0, RCX, SIGN);
MOV(64, R(RDI), R(RSI)); MOV(64, R(RAX), R(RCX));
multiply(); multiply();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
set_long_prod(); set_long_prod();
@ -345,9 +354,9 @@ void DSPEmitter::mul(const UDSPInstruction opc)
u8 sreg = (opc >> 11) & 0x1; u8 sreg = (opc >> 11) & 0x1;
// u16 axl = dsp_get_ax_l(sreg); // u16 axl = dsp_get_ax_l(sreg);
dsp_op_read_reg(DSP_REG_AXL0+sreg, RSI, SIGN); dsp_op_read_reg(DSP_REG_AXL0+sreg, RCX, SIGN);
// u16 axh = dsp_get_ax_h(sreg); // u16 axh = dsp_get_ax_h(sreg);
dsp_op_read_reg(DSP_REG_AXH0+sreg, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXH0+sreg, RAX, SIGN);
// s64 prod = dsp_multiply(axh, axl); // s64 prod = dsp_multiply(axh, axl);
multiply(); multiply();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -377,9 +386,9 @@ void DSPEmitter::mulac(const UDSPInstruction opc)
ADD(64, R(RAX), R(RDX)); ADD(64, R(RAX), R(RDX));
PUSH(64, R(RAX)); PUSH(64, R(RAX));
// u16 axl = dsp_get_ax_l(sreg); // u16 axl = dsp_get_ax_l(sreg);
dsp_op_read_reg(DSP_REG_AXL0+sreg, RSI, SIGN); dsp_op_read_reg(DSP_REG_AXL0+sreg, RCX, SIGN);
// u16 axh = dsp_get_ax_h(sreg); // u16 axh = dsp_get_ax_h(sreg);
dsp_op_read_reg(DSP_REG_AXH0+sreg, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXH0+sreg, RAX, SIGN);
// s64 prod = dsp_multiply(axl, axh); // s64 prod = dsp_multiply(axl, axh);
multiply(); multiply();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -467,9 +476,9 @@ void DSPEmitter::mulx(const UDSPInstruction opc)
u8 sreg = ((opc >> 12) & 0x1); u8 sreg = ((opc >> 12) & 0x1);
// u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0); // u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0);
dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RSI, SIGN); dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RCX, SIGN);
// u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1); // u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1);
dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RAX, SIGN);
// s64 prod = dsp_multiply_mulx(sreg, treg, val1, val2); // s64 prod = dsp_multiply_mulx(sreg, treg, val1, val2);
multiply_mulx(sreg, treg); multiply_mulx(sreg, treg);
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -494,25 +503,28 @@ void DSPEmitter::mulxac(const UDSPInstruction opc)
u8 sreg = (opc >> 12) & 0x1; u8 sreg = (opc >> 12) & 0x1;
// s64 acc = dsp_get_long_acc(rreg) + dsp_get_long_prod(); // s64 acc = dsp_get_long_acc(rreg) + dsp_get_long_prod();
get_long_acc(rreg, RCX); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
get_long_acc(rreg, tmp1);
get_long_prod(); get_long_prod();
ADD(64, R(RCX), R(RAX)); ADD(64, R(tmp1), R(RAX));
// u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0); // u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0);
dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RSI, SIGN); dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RCX, SIGN);
// u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1); // u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1);
dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RAX, SIGN);
// s64 prod = dsp_multiply_mulx(sreg, treg, val1, val2); // s64 prod = dsp_multiply_mulx(sreg, treg, val1, val2);
multiply_mulx(sreg, treg); multiply_mulx(sreg, treg);
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
set_long_prod(); set_long_prod();
// dsp_set_long_acc(rreg, acc); // dsp_set_long_acc(rreg, acc);
set_long_acc(rreg, RCX); set_long_acc(rreg, tmp1);
// Update_SR_Register64(dsp_get_long_acc(rreg)); // Update_SR_Register64(dsp_get_long_acc(rreg));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
Update_SR_Register64(RCX); Update_SR_Register64(tmp1);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -533,23 +545,26 @@ void DSPEmitter::mulxmv(const UDSPInstruction opc)
u8 sreg = (opc >> 12) & 0x1; u8 sreg = (opc >> 12) & 0x1;
// s64 acc = dsp_get_long_prod(); // s64 acc = dsp_get_long_prod();
get_long_prod(RCX); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
get_long_prod(tmp1);
// u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0); // u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0);
dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RSI, SIGN); dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RCX, SIGN);
// u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1); // u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1);
dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RAX, SIGN);
// s64 prod = dsp_multiply_mulx(sreg, treg, val1, val2); // s64 prod = dsp_multiply_mulx(sreg, treg, val1, val2);
multiply_mulx(sreg, treg); multiply_mulx(sreg, treg);
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
set_long_prod(); set_long_prod();
// dsp_set_long_acc(rreg, acc); // dsp_set_long_acc(rreg, acc);
set_long_acc(rreg, RCX); set_long_acc(rreg, tmp1);
// Update_SR_Register64(dsp_get_long_acc(rreg)); // Update_SR_Register64(dsp_get_long_acc(rreg));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
Update_SR_Register64(RCX); Update_SR_Register64(tmp1);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -571,23 +586,26 @@ void DSPEmitter::mulxmvz(const UDSPInstruction opc)
u8 sreg = (opc >> 12) & 0x1; u8 sreg = (opc >> 12) & 0x1;
// s64 acc = dsp_get_long_prod_round_prodl(); // s64 acc = dsp_get_long_prod_round_prodl();
get_long_prod_round_prodl(RCX); X64Reg tmp1;
gpr.getFreeXReg(tmp1);
get_long_prod_round_prodl(tmp1);
// u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0); // u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0);
dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RSI, SIGN); dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RCX, SIGN);
// u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1); // u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1);
dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RAX, SIGN);
// s64 prod = dsp_multiply_mulx(sreg, treg, val1, val2); // s64 prod = dsp_multiply_mulx(sreg, treg, val1, val2);
multiply_mulx(sreg, treg); multiply_mulx(sreg, treg);
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
set_long_prod(); set_long_prod();
// dsp_set_long_acc(rreg, acc); // dsp_set_long_acc(rreg, acc);
set_long_acc(rreg, RCX); set_long_acc(rreg, tmp1);
// Update_SR_Register64(dsp_get_long_acc(rreg)); // Update_SR_Register64(dsp_get_long_acc(rreg));
if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR)) if (!(DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_START_OF_INST) || (DSPAnalyzer::code_flags[compilePC] & DSPAnalyzer::CODE_UPDATE_SR))
{ {
Update_SR_Register64(RCX); Update_SR_Register64(tmp1);
} }
gpr.putXReg(tmp1);
#else #else
Default(opc); Default(opc);
#endif #endif
@ -606,9 +624,9 @@ void DSPEmitter::mulc(const UDSPInstruction opc)
u8 sreg = (opc >> 12) & 0x1; u8 sreg = (opc >> 12) & 0x1;
// u16 accm = dsp_get_acc_m(sreg); // u16 accm = dsp_get_acc_m(sreg);
get_acc_m(sreg, ESI); get_acc_m(sreg, ECX);
// u16 axh = dsp_get_ax_h(treg); // u16 axh = dsp_get_ax_h(treg);
dsp_op_read_reg(DSP_REG_AXH0+treg, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXH0+treg, RAX, SIGN);
// s64 prod = dsp_multiply(accm, axh); // s64 prod = dsp_multiply(accm, axh);
multiply(); multiply();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -639,9 +657,9 @@ void DSPEmitter::mulcac(const UDSPInstruction opc)
ADD(64, R(RAX), R(RDX)); ADD(64, R(RAX), R(RDX));
PUSH(64, R(RAX)); PUSH(64, R(RAX));
// u16 accm = dsp_get_acc_m(sreg); // u16 accm = dsp_get_acc_m(sreg);
get_acc_m(sreg, ESI); get_acc_m(sreg, ECX);
// u16 axh = dsp_get_ax_h(treg); // u16 axh = dsp_get_ax_h(treg);
dsp_op_read_reg(DSP_REG_AXH0+treg, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXH0+treg, RAX, SIGN);
// s64 prod = dsp_multiply(accm, axh); // s64 prod = dsp_multiply(accm, axh);
multiply(); multiply();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -678,9 +696,9 @@ void DSPEmitter::mulcmv(const UDSPInstruction opc)
get_long_prod(); get_long_prod();
PUSH(64, R(RAX)); PUSH(64, R(RAX));
// u16 accm = dsp_get_acc_m(sreg); // u16 accm = dsp_get_acc_m(sreg);
get_acc_m(sreg, ESI); get_acc_m(sreg, ECX);
// u16 axh = dsp_get_ax_h(treg); // u16 axh = dsp_get_ax_h(treg);
dsp_op_read_reg(DSP_REG_AXH0+treg, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXH0+treg, RAX, SIGN);
// s64 prod = dsp_multiply(accm, axh); // s64 prod = dsp_multiply(accm, axh);
multiply(); multiply();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -718,9 +736,9 @@ void DSPEmitter::mulcmvz(const UDSPInstruction opc)
get_long_prod_round_prodl(); get_long_prod_round_prodl();
PUSH(64, R(RAX)); PUSH(64, R(RAX));
// u16 accm = dsp_get_acc_m(sreg); // u16 accm = dsp_get_acc_m(sreg);
get_acc_m(sreg, ESI); get_acc_m(sreg, ECX);
// u16 axh = dsp_get_ax_h(treg); // u16 axh = dsp_get_ax_h(treg);
dsp_op_read_reg(DSP_REG_AXH0+treg, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXH0+treg, RAX, SIGN);
// s64 prod = dsp_multiply(accm, axh); // s64 prod = dsp_multiply(accm, axh);
multiply(); multiply();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -752,9 +770,9 @@ void DSPEmitter::maddx(const UDSPInstruction opc)
u8 sreg = (opc >> 9) & 0x1; u8 sreg = (opc >> 9) & 0x1;
// u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0); // u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0);
dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RSI, SIGN); dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RCX, SIGN);
// u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1); // u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1);
dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RAX, SIGN);
// s64 prod = dsp_multiply_add(val1, val2); // s64 prod = dsp_multiply_add(val1, val2);
multiply_add(); multiply_add();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -776,9 +794,9 @@ void DSPEmitter::msubx(const UDSPInstruction opc)
u8 sreg = (opc >> 9) & 0x1; u8 sreg = (opc >> 9) & 0x1;
// u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0); // u16 val1 = (sreg == 0) ? dsp_get_ax_l(0) : dsp_get_ax_h(0);
dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RSI, SIGN); dsp_op_read_reg(DSP_REG_AXL0 + sreg*2, RCX, SIGN);
// u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1); // u16 val2 = (treg == 0) ? dsp_get_ax_l(1) : dsp_get_ax_h(1);
dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXL1 + treg*2, RAX, SIGN);
// s64 prod = dsp_multiply_sub(val1, val2); // s64 prod = dsp_multiply_sub(val1, val2);
multiply_sub(); multiply_sub();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -800,9 +818,9 @@ void DSPEmitter::maddc(const UDSPInstruction opc)
u8 sreg = (opc >> 9) & 0x1; u8 sreg = (opc >> 9) & 0x1;
// u16 accm = dsp_get_acc_m(sreg); // u16 accm = dsp_get_acc_m(sreg);
get_acc_m(sreg, ESI); get_acc_m(sreg, ECX);
// u16 axh = dsp_get_ax_h(treg); // u16 axh = dsp_get_ax_h(treg);
dsp_op_read_reg(DSP_REG_AXH0+treg, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXH0+treg, RAX, SIGN);
// s64 prod = dsp_multiply_add(accm, axh); // s64 prod = dsp_multiply_add(accm, axh);
multiply_add(); multiply_add();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -824,9 +842,9 @@ void DSPEmitter::msubc(const UDSPInstruction opc)
u8 sreg = (opc >> 9) & 0x1; u8 sreg = (opc >> 9) & 0x1;
// u16 accm = dsp_get_acc_m(sreg); // u16 accm = dsp_get_acc_m(sreg);
get_acc_m(sreg, ESI); get_acc_m(sreg, ECX);
// u16 axh = dsp_get_ax_h(treg); // u16 axh = dsp_get_ax_h(treg);
dsp_op_read_reg(DSP_REG_AXH0+treg, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXH0+treg, RAX, SIGN);
// s64 prod = dsp_multiply_sub(accm, axh); // s64 prod = dsp_multiply_sub(accm, axh);
multiply_sub(); multiply_sub();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -847,9 +865,9 @@ void DSPEmitter::madd(const UDSPInstruction opc)
u8 sreg = (opc >> 8) & 0x1; u8 sreg = (opc >> 8) & 0x1;
// u16 axl = dsp_get_ax_l(sreg); // u16 axl = dsp_get_ax_l(sreg);
dsp_op_read_reg(DSP_REG_AXL0+sreg, RSI, SIGN); dsp_op_read_reg(DSP_REG_AXL0+sreg, RCX, SIGN);
// u16 axh = dsp_get_ax_h(sreg); // u16 axh = dsp_get_ax_h(sreg);
dsp_op_read_reg(DSP_REG_AXH0+sreg, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXH0+sreg, RAX, SIGN);
// s64 prod = dsp_multiply_add(axl, axh); // s64 prod = dsp_multiply_add(axl, axh);
multiply_add(); multiply_add();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);
@ -870,9 +888,9 @@ void DSPEmitter::msub(const UDSPInstruction opc)
u8 sreg = (opc >> 8) & 0x1; u8 sreg = (opc >> 8) & 0x1;
// u16 axl = dsp_get_ax_l(sreg); // u16 axl = dsp_get_ax_l(sreg);
dsp_op_read_reg(DSP_REG_AXL0+sreg, RSI, SIGN); dsp_op_read_reg(DSP_REG_AXL0+sreg, RCX, SIGN);
// u16 axh = dsp_get_ax_h(sreg); // u16 axh = dsp_get_ax_h(sreg);
dsp_op_read_reg(DSP_REG_AXH0+sreg, RDI, SIGN); dsp_op_read_reg(DSP_REG_AXH0+sreg, RAX, SIGN);
// s64 prod = dsp_multiply_sub(axl, axh); // s64 prod = dsp_multiply_sub(axl, axh);
multiply_sub(); multiply_sub();
// dsp_set_long_prod(prod); // dsp_set_long_prod(prod);

File diff suppressed because it is too large Load Diff

View File

@ -23,12 +23,16 @@
class DSPEmitter; class DSPEmitter;
enum DSPJitRegSpecial { enum DSPJitRegSpecial {
DSP_REG_ACC0_64 =32, DSP_REG_AX0_32 =32,
DSP_REG_ACC1_64 =33, DSP_REG_AX1_32 =33,
DSP_REG_AX0_32 =34, #ifdef _M_X64
DSP_REG_AX1_32 =35, DSP_REG_ACC0_64 =34,
DSP_REG_ACC1_64 =35,
DSP_REG_PROD_64 =36, DSP_REG_PROD_64 =36,
DSP_REG_MAX_MEM_BACKED = 36, DSP_REG_MAX_MEM_BACKED = 36,
#else
DSP_REG_MAX_MEM_BACKED = 33,
#endif
DSP_REG_USED =253, DSP_REG_USED =253,
DSP_REG_STATIC =254, DSP_REG_STATIC =254,
@ -50,24 +54,28 @@ private:
struct X64CachedReg struct X64CachedReg
{ {
int guest_reg; //including DSPJitRegSpecial int guest_reg; //including DSPJitRegSpecial
bool pushed;
}; };
struct DynamicReg { struct DynamicReg {
Gen::OpArg loc; Gen::OpArg loc;
void *mem; void *mem;
size_t size; size_t size;
bool dirty; bool dirty;
};
#ifdef _M_X64
//when there is a way to do this efficiently in x86, uncondition
struct {
Gen::X64Reg host_reg;
int shift;
bool dirty;
bool used; bool used;
Gen::X64Reg tmp_reg; int last_use_ctr;
} acc[2]; int parentReg;
#endif int shift;//current shift if parentReg == DSP_REG_NONE
//otherwise the shift this part can be found at
Gen::X64Reg host_reg;
/* todo:
+ drop sameReg
+ add parentReg
+ add shift:
- if parentReg != DSP_REG_NONE, this is the shift where this
register is found in the parentReg
- if parentReg == DSP_REG_NONE, this is the current shift _state_
*/
};
DynamicReg regs[DSP_REG_MAX_MEM_BACKED+1]; DynamicReg regs[DSP_REG_MAX_MEM_BACKED+1];
X64CachedReg xregs[NUMXREGS]; X64CachedReg xregs[NUMXREGS];
@ -75,11 +83,21 @@ private:
DSPEmitter &emitter; DSPEmitter &emitter;
bool temporary; bool temporary;
bool merged; bool merged;
int use_ctr;
private: private:
//find a free host reg //find a free host reg
Gen::X64Reg findFreeXReg(); Gen::X64Reg findFreeXReg();
Gen::X64Reg spillXReg(); Gen::X64Reg spillXReg();
Gen::X64Reg findSpillFreeXReg();
void spillXReg(Gen::X64Reg reg); void spillXReg(Gen::X64Reg reg);
void movToHostReg(int reg, Gen::X64Reg host_reg, bool load);
void movToHostReg(int reg, bool load);
void rotateHostReg(int reg, int shift, bool emit);
void movToMemory(int reg);
void flushMemBackedRegs();
public: public:
DSPJitRegCache(DSPEmitter &_emitter); DSPJitRegCache(DSPEmitter &_emitter);
@ -147,10 +165,19 @@ public:
//prepare state so that another flushed DSPJitRegCache can take over //prepare state so that another flushed DSPJitRegCache can take over
void flushRegs(); void flushRegs();
void loadStaticRegs();//load statically allocated regs from memory void loadRegs(bool emit=true);//load statically allocated regs from memory
void saveStaticRegs();//save statically allocated regs to memory void saveRegs();//save statically allocated regs to memory
void pushRegs();//save registers before abi call
void popRegs();//restore registers after abi call
//returns a register with the same contents as reg that is safe
//to use through saveStaticRegs and for ABI-calls
Gen::X64Reg makeABICallSafe(Gen::X64Reg reg);
//gives no SCALE_RIP with abs(offset) >= 0x80000000 //gives no SCALE_RIP with abs(offset) >= 0x80000000
//32/64 bit writes allowed when the register has a _64 or _32 suffix
//only 16 bit writes allowed without any suffix.
void getReg(int reg, Gen::OpArg &oparg, bool load = true); void getReg(int reg, Gen::OpArg &oparg, bool load = true);
//done with all usages of OpArg above //done with all usages of OpArg above
void putReg(int reg, bool dirty = true); void putReg(int reg, bool dirty = true);

View File

@ -36,32 +36,32 @@ using namespace Gen;
// EAX = g_dsp.r.ar[reg] // EAX = g_dsp.r.ar[reg]
// EDX = g_dsp.r.wr[reg] // EDX = g_dsp.r.wr[reg]
// EDI = temp
// ECX = temp
void DSPEmitter::increment_addr_reg(int reg) void DSPEmitter::increment_addr_reg(int reg)
{ {
OpArg ar_reg; OpArg ar_reg;
OpArg wr_reg; OpArg wr_reg;
gpr.getReg(DSP_REG_WR0+reg,wr_reg); gpr.getReg(DSP_REG_WR0+reg,wr_reg);
MOVZX(32, 16, EDX, wr_reg); MOVZX(32, 16, EDX, wr_reg);
gpr.putReg(DSP_REG_WR0+reg); gpr.putReg(DSP_REG_WR0+reg, false);
gpr.getReg(DSP_REG_AR0+reg,ar_reg); gpr.getReg(DSP_REG_AR0+reg,ar_reg);
MOVZX(32, 16, EAX, ar_reg); MOVZX(32, 16, EAX, ar_reg);
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
//u32 nar = ar + 1; //u32 nar = ar + 1;
MOV(32, R(EDI), R(EAX)); MOV(32, R(tmp1), R(EAX));
ADD(32, R(EAX), Imm8(1)); ADD(32, R(EAX), Imm8(1));
// if ((nar ^ ar) > ((wr | 1) << 1)) // if ((nar ^ ar) > ((wr | 1) << 1))
// nar -= wr + 1; // nar -= wr + 1;
XOR(32, R(EDI), R(EAX)); XOR(32, R(tmp1), R(EAX));
LEA(32, ECX, MComplex(EDX, EDX, 1, 0)); LEA(32, ECX, MRegSum(EDX, EDX));
OR(32, R(ECX), Imm8(2)); OR(32, R(ECX), Imm8(2));
CMP(32, R(EDI), R(ECX)); CMP(32, R(tmp1), R(ECX));
FixupBranch nowrap = J_CC(CC_BE); FixupBranch nowrap = J_CC(CC_BE);
SUB(16, R(AX), R(DX)); SUB(16, R(AX), R(DX));
SUB(16, R(AX), Imm8(1)); SUB(16, R(AX), Imm8(1));
SetJumpTarget(nowrap); SetJumpTarget(nowrap);
gpr.putXReg(tmp1);
// g_dsp.r.ar[reg] = nar; // g_dsp.r.ar[reg] = nar;
MOV(16, ar_reg, R(AX)); MOV(16, ar_reg, R(AX));
@ -70,171 +70,173 @@ void DSPEmitter::increment_addr_reg(int reg)
// EAX = g_dsp.r.ar[reg] // EAX = g_dsp.r.ar[reg]
// EDX = g_dsp.r.wr[reg] // EDX = g_dsp.r.wr[reg]
// EDI = temp
// ECX = temp
void DSPEmitter::decrement_addr_reg(int reg) void DSPEmitter::decrement_addr_reg(int reg)
{ {
OpArg ar_reg; OpArg ar_reg;
OpArg wr_reg; OpArg wr_reg;
gpr.getReg(DSP_REG_WR0+reg,wr_reg); gpr.getReg(DSP_REG_WR0+reg,wr_reg);
MOVZX(32, 16, EDX, wr_reg); MOVZX(32, 16, EDX, wr_reg);
gpr.putReg(DSP_REG_WR0+reg); gpr.putReg(DSP_REG_WR0+reg, false);
gpr.getReg(DSP_REG_AR0+reg,ar_reg); gpr.getReg(DSP_REG_AR0+reg,ar_reg);
MOVZX(32, 16, EAX, ar_reg); MOVZX(32, 16, EAX, ar_reg);
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
// u32 nar = ar + wr; // u32 nar = ar + wr;
// edi = nar // edi = nar
LEA(32, EDI, MComplex(EAX, EDX, 1, 0)); LEA(32, tmp1, MRegSum(EAX, EDX));
// if (((nar ^ ar) & ((wr | 1) << 1)) > wr) // if (((nar ^ ar) & ((wr | 1) << 1)) > wr)
// nar -= wr + 1; // nar -= wr + 1;
XOR(32, R(EAX), R(EDI)); XOR(32, R(EAX), R(tmp1));
LEA(32, ECX, MComplex(EDX, EDX, 1, 0)); LEA(32, ECX, MRegSum(EDX, EDX));
OR(32, R(ECX), Imm8(2)); OR(32, R(ECX), Imm8(2));
AND(32, R(EAX), R(ECX)); AND(32, R(EAX), R(ECX));
CMP(32, R(EAX), R(EDX)); CMP(32, R(EAX), R(EDX));
FixupBranch nowrap = J_CC(CC_BE); FixupBranch nowrap = J_CC(CC_BE);
SUB(16, R(DI), R(DX)); SUB(16, R(tmp1), R(DX));
SUB(16, R(DI), Imm8(1)); SUB(16, R(tmp1), Imm8(1));
SetJumpTarget(nowrap); SetJumpTarget(nowrap);
// g_dsp.r.ar[reg] = nar; // g_dsp.r.ar[reg] = nar;
MOV(16, ar_reg, R(DI)); MOV(16, ar_reg, R(tmp1));
gpr.putReg(DSP_REG_AR0+reg); gpr.putReg(DSP_REG_AR0+reg);
gpr.putXReg(tmp1);
} }
// Increase addr register according to the correspond ix register // Increase addr register according to the correspond ix register
// EAX = g_dsp.r.ar[reg] // EAX = g_dsp.r.ar[reg]
// EDX = g_dsp.r.wr[reg] // EDX = g_dsp.r.wr[reg]
// ESI = g_dsp.r.ix[reg] // ECX = g_dsp.r.ix[reg]
// ECX = temp void DSPEmitter::increase_addr_reg(int reg, int _ix_reg)
// EDI = temp {
void DSPEmitter::increase_addr_reg(int reg)
{
OpArg ar_reg; OpArg ar_reg;
OpArg wr_reg; OpArg wr_reg;
OpArg ix_reg; OpArg ix_reg;
gpr.getReg(DSP_REG_WR0+reg,wr_reg); gpr.getReg(DSP_REG_WR0+reg,wr_reg);
gpr.getReg(DSP_REG_IX0+reg,ix_reg);
MOVZX(32, 16, EDX, wr_reg); MOVZX(32, 16, EDX, wr_reg);
MOVSX(32, 16, ESI, ix_reg); gpr.putReg(DSP_REG_WR0+reg, false);
gpr.putReg(DSP_REG_WR0+reg); gpr.getReg(DSP_REG_IX0+_ix_reg,ix_reg);
gpr.putReg(DSP_REG_IX0+reg); MOVSX(32, 16, ECX, ix_reg);
gpr.putReg(DSP_REG_IX0+_ix_reg, false);
gpr.getReg(DSP_REG_AR0+reg,ar_reg); gpr.getReg(DSP_REG_AR0+reg,ar_reg);
MOVZX(32, 16, EAX, ar_reg); MOVZX(32, 16, EAX, ar_reg);
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
//u32 nar = ar + ix; //u32 nar = ar + ix;
//edi = nar //edi = nar
LEA(32, EDI, MComplex(EAX, ESI, 1, 0)); LEA(32, tmp1, MRegSum(EAX, ECX));
//u32 dar = (nar ^ ar ^ ix) & ((wr | 1) << 1); //u32 dar = (nar ^ ar ^ ix) & ((wr | 1) << 1);
//eax = dar //eax = dar
XOR(32, R(EAX), R(ESI)); XOR(32, R(EAX), R(ECX));
XOR(32, R(EAX), R(EDI)); XOR(32, R(EAX), R(tmp1));
LEA(32, ECX, MComplex(EDX, EDX, 1, 0)); LEA(32, ECX, MRegSum(EDX, EDX));
OR(32, R(ECX), Imm8(2)); OR(32, R(ECX), Imm8(2));
AND(32, R(EAX), R(ECX)); AND(32, R(EAX), R(ECX));
//if (ix >= 0) //if (ix >= 0)
TEST(32, R(ESI), R(ESI)); TEST(32, R(ECX), R(ECX));
FixupBranch negative = J_CC(CC_S); FixupBranch negative = J_CC(CC_S);
//if (dar > wr) //if (dar > wr)
CMP(32, R(EAX), R(EDX)); CMP(32, R(EAX), R(EDX));
FixupBranch done = J_CC(CC_BE); FixupBranch done = J_CC(CC_BE);
//nar -= wr + 1; //nar -= wr + 1;
SUB(16, R(DI), R(DX)); SUB(16, R(tmp1), R(DX));
SUB(16, R(DI), Imm8(1)); SUB(16, R(tmp1), Imm8(1));
FixupBranch done2 = J(); FixupBranch done2 = J();
//else //else
SetJumpTarget(negative); SetJumpTarget(negative);
//if ((((nar + wr + 1) ^ nar) & dar) <= wr) //if ((((nar + wr + 1) ^ nar) & dar) <= wr)
LEA(32, ECX, MComplex(EDI, EDX, 1, 1)); LEA(32, ECX, MComplex(tmp1, EDX, 1, 1));
XOR(32, R(ECX), R(EDI)); XOR(32, R(ECX), R(tmp1));
AND(32, R(ECX), R(EAX)); AND(32, R(ECX), R(EAX));
CMP(32, R(ECX), R(EDX)); CMP(32, R(ECX), R(EDX));
FixupBranch done3 = J_CC(CC_A); FixupBranch done3 = J_CC(CC_A);
//nar += wr + 1; //nar += wr + 1;
LEA(32, EDI, MComplex(EDI, EDX, 1, 1)); LEA(32, tmp1, MComplex(tmp1, EDX, 1, 1));
SetJumpTarget(done); SetJumpTarget(done);
SetJumpTarget(done2); SetJumpTarget(done2);
SetJumpTarget(done3); SetJumpTarget(done3);
// g_dsp.r.ar[reg] = nar; // g_dsp.r.ar[reg] = nar;
MOV(16, ar_reg, R(DI)); MOV(16, ar_reg, R(tmp1));
gpr.putReg(DSP_REG_AR0+reg); gpr.putReg(DSP_REG_AR0+reg);
gpr.putXReg(tmp1);
} }
// Decrease addr register according to the correspond ix register // Decrease addr register according to the correspond ix register
// EAX = g_dsp.r.ar[reg] // EAX = g_dsp.r.ar[reg]
// EDX = g_dsp.r.wr[reg] // EDX = g_dsp.r.wr[reg]
// ESI = g_dsp.r.ix[reg] // ECX = g_dsp.r.ix[reg]
// ECX = temp
// EDI = temp
void DSPEmitter::decrease_addr_reg(int reg) void DSPEmitter::decrease_addr_reg(int reg)
{ {
OpArg ar_reg; OpArg ar_reg;
OpArg wr_reg; OpArg wr_reg;
OpArg ix_reg; OpArg ix_reg;
gpr.getReg(DSP_REG_WR0+reg,wr_reg); gpr.getReg(DSP_REG_WR0+reg,wr_reg);
gpr.getReg(DSP_REG_IX0+reg,ix_reg);
MOVZX(32, 16, EDX, wr_reg); MOVZX(32, 16, EDX, wr_reg);
MOVSX(32, 16, ESI, ix_reg); gpr.putReg(DSP_REG_WR0+reg, false);
gpr.putReg(DSP_REG_WR0+reg); gpr.getReg(DSP_REG_IX0+reg,ix_reg);
gpr.putReg(DSP_REG_IX0+reg); MOVSX(32, 16, ECX, ix_reg);
gpr.putReg(DSP_REG_IX0+reg, false);
gpr.getReg(DSP_REG_AR0+reg,ar_reg); gpr.getReg(DSP_REG_AR0+reg,ar_reg);
MOVZX(32, 16, EAX, ar_reg); MOVZX(32, 16, EAX, ar_reg);
NOT(32, R(ESI)); //esi = ~ix NOT(32, R(ECX)); //esi = ~ix
X64Reg tmp1;
gpr.getFreeXReg(tmp1);
//u32 nar = ar - ix; (ar + ~ix + 1) //u32 nar = ar - ix; (ar + ~ix + 1)
LEA(32, EDI, MComplex(EAX, ESI, 1, 1)); LEA(32, tmp1, MComplex(EAX, ECX, 1, 1));
//u32 dar = (nar ^ ar ^ ~ix) & ((wr | 1) << 1); //u32 dar = (nar ^ ar ^ ~ix) & ((wr | 1) << 1);
//eax = dar //eax = dar
XOR(32, R(EAX), R(ESI)); XOR(32, R(EAX), R(ECX));
XOR(32, R(EAX), R(EDI)); XOR(32, R(EAX), R(tmp1));
LEA(32, ECX, MComplex(EDX, EDX, 1, 0)); LEA(32, ECX, MRegSum(EDX, EDX));
OR(32, R(ECX), Imm8(2)); OR(32, R(ECX), Imm8(2));
AND(32, R(EAX), R(ECX)); AND(32, R(EAX), R(ECX));
//if ((u32)ix > 0xFFFF8000) ==> (~ix < 0x00007FFF) //if ((u32)ix > 0xFFFF8000) ==> (~ix < 0x00007FFF)
CMP(32, R(ESI), Imm32(0x00007FFF)); CMP(32, R(ECX), Imm32(0x00007FFF));
FixupBranch positive = J_CC(CC_AE); FixupBranch positive = J_CC(CC_AE);
//if (dar > wr) //if (dar > wr)
CMP(32, R(EAX), R(EDX)); CMP(32, R(EAX), R(EDX));
FixupBranch done = J_CC(CC_BE); FixupBranch done = J_CC(CC_BE);
//nar -= wr + 1; //nar -= wr + 1;
SUB(16, R(DI), R(DX)); SUB(16, R(tmp1), R(DX));
SUB(16, R(DI), Imm8(1)); SUB(16, R(tmp1), Imm8(1));
FixupBranch done2 = J(); FixupBranch done2 = J();
//else //else
SetJumpTarget(positive); SetJumpTarget(positive);
//if ((((nar + wr + 1) ^ nar) & dar) <= wr) //if ((((nar + wr + 1) ^ nar) & dar) <= wr)
LEA(32, ECX, MComplex(EDI, EDX, 1, 1)); LEA(32, ECX, MComplex(tmp1, EDX, 1, 1));
XOR(32, R(ECX), R(EDI)); XOR(32, R(ECX), R(tmp1));
AND(32, R(ECX), R(EAX)); AND(32, R(ECX), R(EAX));
CMP(32, R(ECX), R(EDX)); CMP(32, R(ECX), R(EDX));
FixupBranch done3 = J_CC(CC_A); FixupBranch done3 = J_CC(CC_A);
//nar += wr + 1; //nar += wr + 1;
LEA(32, EDI, MComplex(EDI, EDX, 1, 1)); LEA(32, tmp1, MComplex(tmp1, EDX, 1, 1));
SetJumpTarget(done); SetJumpTarget(done);
SetJumpTarget(done2); SetJumpTarget(done2);
SetJumpTarget(done3); SetJumpTarget(done3);
//return nar //return nar
MOV(16, ar_reg, R(DI)); MOV(16, ar_reg, R(tmp1));
gpr.putReg(DSP_REG_AR0+reg); gpr.putReg(DSP_REG_AR0+reg);
gpr.putXReg(tmp1);
} }
// EAX - destination address // EAX - destination address
// ECX - value // ECX - Base of dram
// ESI - Base of dram void DSPEmitter::dmem_write(X64Reg value)
void DSPEmitter::dmem_write()
{ {
// if (saddr == 0) // if (saddr == 0)
CMP(16, R(EAX), Imm16(0x0fff)); CMP(16, R(EAX), Imm16(0x0fff));
@ -243,45 +245,47 @@ void DSPEmitter::dmem_write()
// g_dsp.dram[addr & DSP_DRAM_MASK] = val; // g_dsp.dram[addr & DSP_DRAM_MASK] = val;
AND(16, R(EAX), Imm16(DSP_DRAM_MASK)); AND(16, R(EAX), Imm16(DSP_DRAM_MASK));
#ifdef _M_X64 #ifdef _M_X64
MOV(64, R(ESI), ImmPtr(g_dsp.dram)); MOV(64, R(ECX), ImmPtr(g_dsp.dram));
#else #else
MOV(32, R(ESI), ImmPtr(g_dsp.dram)); MOV(32, R(ECX), ImmPtr(g_dsp.dram));
#endif #endif
MOV(16, MComplex(ESI, EAX, 2, 0), R(ECX)); MOV(16, MComplex(ECX, EAX, 2, 0), R(value));
FixupBranch end = J(); FixupBranch end = J(true);
// else if (saddr == 0xf) // else if (saddr == 0xf)
SetJumpTarget(ifx); SetJumpTarget(ifx);
// Does it mean gdsp_ifx_write needs u32 rather than u16? // Does it mean gdsp_ifx_write needs u32 rather than u16?
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
SaveDSPRegs(); X64Reg abisafereg = gpr.makeABICallSafe(value);
ABI_CallFunctionRR((void *)gdsp_ifx_write, EAX, ECX); gpr.pushRegs();
LoadDSPRegs(); ABI_CallFunctionRR((void *)gdsp_ifx_write, EAX, abisafereg);
gpr.popRegs();
gpr.flushRegs(c); gpr.flushRegs(c);
SetJumpTarget(end); SetJumpTarget(end);
} }
// ECX - value void DSPEmitter::dmem_write_imm(u16 address, X64Reg value)
void DSPEmitter::dmem_write_imm(u16 address)
{ {
switch (address >> 12) switch (address >> 12)
{ {
case 0x0: // 0xxx DRAM case 0x0: // 0xxx DRAM
#ifdef _M_IX86 // All32 #ifdef _M_IX86 // All32
MOV(16, M(&g_dsp.dram[address & DSP_DRAM_MASK]), R(ECX)); MOV(16, M(&g_dsp.dram[address & DSP_DRAM_MASK]), R(value));
#else #else
MOV(64, R(RDX), ImmPtr(g_dsp.dram)); MOV(64, R(RDX), ImmPtr(g_dsp.dram));
MOV(16, MDisp(RDX, (address & DSP_DRAM_MASK)*2), R(ECX)); MOV(16, MDisp(RDX, (address & DSP_DRAM_MASK)*2), R(value));
#endif #endif
break; break;
case 0xf: // Fxxx HW regs case 0xf: // Fxxx HW regs
{
MOV(16, R(EAX), Imm16(address)); MOV(16, R(EAX), Imm16(address));
SaveDSPRegs(); X64Reg abisafereg = gpr.makeABICallSafe(value);
ABI_CallFunctionRR((void *)gdsp_ifx_write, EAX, ECX); gpr.pushRegs();
LoadDSPRegs(); ABI_CallFunctionRR((void *)gdsp_ifx_write, EAX, abisafereg);
gpr.popRegs();
break; break;
}
default: // Unmapped/non-existing memory default: // Unmapped/non-existing memory
ERROR_LOG(DSPLLE, "%04x DSP ERROR: Write to UNKNOWN (%04x) memory", ERROR_LOG(DSPLLE, "%04x DSP ERROR: Write to UNKNOWN (%04x) memory",
g_dsp.pc, address); g_dsp.pc, address);
@ -289,81 +293,80 @@ void DSPEmitter::dmem_write_imm(u16 address)
} }
} }
// In: ECX - the address to read // In: (address) - the address to read
// Out: EAX - the result of the read (used by caller) // Out: EAX - the result of the read (used by caller)
// ESI - Base // ECX - Base
void DSPEmitter::imem_read() void DSPEmitter::imem_read(X64Reg address)
{ {
// if (addr == 0) // if (addr == 0)
CMP(16, R(ECX), Imm16(0x0fff)); CMP(16, R(address), Imm16(0x0fff));
FixupBranch irom = J_CC(CC_A); FixupBranch irom = J_CC(CC_A);
// return g_dsp.iram[addr & DSP_IRAM_MASK]; // return g_dsp.iram[addr & DSP_IRAM_MASK];
AND(16, R(ECX), Imm16(DSP_IRAM_MASK)); AND(16, R(address), Imm16(DSP_IRAM_MASK));
#ifdef _M_X64 #ifdef _M_X64
MOV(64, R(ESI), ImmPtr(g_dsp.iram)); MOV(64, R(ECX), ImmPtr(g_dsp.iram));
#else #else
MOV(32, R(ESI), ImmPtr(g_dsp.iram)); MOV(32, R(ECX), ImmPtr(g_dsp.iram));
#endif #endif
MOV(16, R(EAX), MComplex(ESI, ECX, 2, 0)); MOV(16, R(EAX), MComplex(ECX, address, 2, 0));
FixupBranch end = J(); FixupBranch end = J();
SetJumpTarget(irom); SetJumpTarget(irom);
// else if (addr == 0x8) // else if (addr == 0x8)
// return g_dsp.irom[addr & DSP_IROM_MASK]; // return g_dsp.irom[addr & DSP_IROM_MASK];
AND(16, R(ECX), Imm16(DSP_IROM_MASK)); AND(16, R(address), Imm16(DSP_IROM_MASK));
#ifdef _M_X64 #ifdef _M_X64
MOV(64, R(ESI), ImmPtr(g_dsp.irom)); MOV(64, R(ECX), ImmPtr(g_dsp.irom));
#else #else
MOV(32, R(ESI), ImmPtr(g_dsp.irom)); MOV(32, R(ECX), ImmPtr(g_dsp.irom));
#endif #endif
MOV(16, R(EAX), MComplex(ESI, ECX, 2, 0)); MOV(16, R(EAX), MComplex(ECX, address, 2, 0));
SetJumpTarget(end); SetJumpTarget(end);
} }
// In: ECX - the address to read // In: (address) - the address to read
// Out: EAX - the result of the read (used by caller) // Out: EAX - the result of the read (used by caller)
// ESI - Base // ECX - Base
void DSPEmitter::dmem_read() void DSPEmitter::dmem_read(X64Reg address)
{ {
// if (saddr == 0) // if (saddr == 0)
CMP(16, R(ECX), Imm16(0x0fff)); CMP(16, R(address), Imm16(0x0fff));
FixupBranch dram = J_CC(CC_A); FixupBranch dram = J_CC(CC_A);
// return g_dsp.dram[addr & DSP_DRAM_MASK]; // return g_dsp.dram[addr & DSP_DRAM_MASK];
AND(32, R(address), Imm32(DSP_DRAM_MASK));
#ifdef _M_X64 #ifdef _M_X64
AND(16, R(ECX), Imm16(DSP_DRAM_MASK)); MOVZX(64, 16, address, R(address));
MOVZX(64, 16, RCX, R(RCX)); MOV(64, R(ECX), ImmPtr(g_dsp.dram));
MOV(64, R(ESI), ImmPtr(g_dsp.dram));
#else #else
AND(32, R(ECX), Imm32(DSP_DRAM_MASK)); MOV(32, R(ECX), ImmPtr(g_dsp.dram));
MOV(32, R(ESI), ImmPtr(g_dsp.dram));
#endif #endif
MOV(16, R(EAX), MComplex(ESI, ECX, 2, 0)); MOV(16, R(EAX), MComplex(ECX, address, 2, 0));
FixupBranch end = J(); FixupBranch end = J(true);
SetJumpTarget(dram); SetJumpTarget(dram);
// else if (saddr == 0x1) // else if (saddr == 0x1)
CMP(16, R(ECX), Imm16(0x1fff)); CMP(16, R(address), Imm16(0x1fff));
FixupBranch ifx = J_CC(CC_A); FixupBranch ifx = J_CC(CC_A);
// return g_dsp.coef[addr & DSP_COEF_MASK]; // return g_dsp.coef[addr & DSP_COEF_MASK];
AND(32, R(address), Imm32(DSP_COEF_MASK));
#ifdef _M_X64 #ifdef _M_X64
AND(16, R(ECX), Imm16(DSP_COEF_MASK)); MOVZX(64, 16, address, R(address));
MOVZX(64, 16, RCX, R(RCX)); MOV(64, R(ECX), ImmPtr(g_dsp.coef));
MOV(64, R(ESI), ImmPtr(g_dsp.coef));
#else #else
AND(32, R(ECX), Imm32(DSP_COEF_MASK)); MOV(32, R(ECX), ImmPtr(g_dsp.coef));
MOV(32, R(ESI), ImmPtr(g_dsp.coef));
#endif #endif
MOV(16, R(EAX), MComplex(ESI, ECX, 2, 0)); MOV(16, R(EAX), MComplex(ECX, address, 2, 0));
FixupBranch end2 = J(); FixupBranch end2 = J(true);
SetJumpTarget(ifx); SetJumpTarget(ifx);
// else if (saddr == 0xf) // else if (saddr == 0xf)
// return gdsp_ifx_read(addr); // return gdsp_ifx_read(addr);
DSPJitRegCache c(gpr); DSPJitRegCache c(gpr);
SaveDSPRegs(); X64Reg abisafereg = gpr.makeABICallSafe(address);
ABI_CallFunctionR((void *)gdsp_ifx_read, ECX); gpr.pushRegs();
LoadDSPRegs(); ABI_CallFunctionR((void *)gdsp_ifx_read, abisafereg);
gpr.popRegs();
gpr.flushRegs(c); gpr.flushRegs(c);
SetJumpTarget(end); SetJumpTarget(end);
SetJumpTarget(end2); SetJumpTarget(end2);
@ -392,11 +395,12 @@ void DSPEmitter::dmem_read_imm(u16 address)
break; break;
case 0xf: // Fxxx HW regs case 0xf: // Fxxx HW regs
SaveDSPRegs(); {
gpr.pushRegs();
ABI_CallFunctionC16((void *)gdsp_ifx_read, address); ABI_CallFunctionC16((void *)gdsp_ifx_read, address);
LoadDSPRegs(); gpr.popRegs();
break; break;
}
default: // Unmapped/non-existing memory default: // Unmapped/non-existing memory
ERROR_LOG(DSPLLE, "%04x DSP ERROR: Read from UNKNOWN (%04x) memory", ERROR_LOG(DSPLLE, "%04x DSP ERROR: Read from UNKNOWN (%04x) memory",
g_dsp.pc, address); g_dsp.pc, address);
@ -408,11 +412,13 @@ void DSPEmitter::get_long_prod(X64Reg long_prod)
{ {
#ifdef _M_X64 #ifdef _M_X64
//s64 val = (s8)(u8)g_dsp.r[DSP_REG_PRODH]; //s64 val = (s8)(u8)g_dsp.r[DSP_REG_PRODH];
OpArg reg; OpArg prod_reg;
gpr.getReg(DSP_REG_PROD_64, reg); gpr.getReg(DSP_REG_PROD_64, prod_reg);
MOV(64, R(long_prod), prod_reg);
gpr.putReg(DSP_REG_PROD_64, false);
//no use in keeping prod_reg any longer.
X64Reg tmp; X64Reg tmp;
gpr.getFreeXReg(tmp); gpr.getFreeXReg(tmp);
MOV(64, R(long_prod), reg);
MOV(64, R(tmp), R(long_prod)); MOV(64, R(tmp), R(long_prod));
SHL(64, R(long_prod), Imm8(64-40));//sign extend SHL(64, R(long_prod), Imm8(64-40));//sign extend
SAR(64, R(long_prod), Imm8(64-40)); SAR(64, R(long_prod), Imm8(64-40));
@ -420,33 +426,35 @@ void DSPEmitter::get_long_prod(X64Reg long_prod)
SHL(64, R(tmp), Imm8(16)); SHL(64, R(tmp), Imm8(16));
ADD(64, R(long_prod), R(tmp)); ADD(64, R(long_prod), R(tmp));
gpr.putXReg(tmp); gpr.putXReg(tmp);
gpr.putReg(DSP_REG_PROD_64, false);
#endif #endif
} }
// Returns s64 in RAX // Returns s64 in RAX
// Clobbers RSI // Clobbers RCX
void DSPEmitter::get_long_prod_round_prodl(X64Reg long_prod) void DSPEmitter::get_long_prod_round_prodl(X64Reg long_prod)
{ {
#ifdef _M_X64 #ifdef _M_X64
//s64 prod = dsp_get_long_prod(); //s64 prod = dsp_get_long_prod();
get_long_prod(long_prod); get_long_prod(long_prod);
X64Reg tmp;
gpr.getFreeXReg(tmp);
//if (prod & 0x10000) prod = (prod + 0x8000) & ~0xffff; //if (prod & 0x10000) prod = (prod + 0x8000) & ~0xffff;
TEST(32, R(long_prod), Imm32(0x10000)); TEST(32, R(long_prod), Imm32(0x10000));
FixupBranch jump = J_CC(CC_Z); FixupBranch jump = J_CC(CC_Z);
ADD(64, R(long_prod), Imm32(0x8000)); ADD(64, R(long_prod), Imm32(0x8000));
MOV(64, R(ESI), Imm64(~0xffff)); MOV(64, R(tmp), Imm64(~0xffff));
AND(64, R(long_prod), R(RSI)); AND(64, R(long_prod), R(tmp));
FixupBranch _ret = J(); FixupBranch _ret = J();
//else prod = (prod + 0x7fff) & ~0xffff; //else prod = (prod + 0x7fff) & ~0xffff;
SetJumpTarget(jump); SetJumpTarget(jump);
ADD(64, R(long_prod), Imm32(0x7fff)); ADD(64, R(long_prod), Imm32(0x7fff));
MOV(64, R(RSI), Imm64(~0xffff)); MOV(64, R(tmp), Imm64(~0xffff));
AND(64, R(long_prod), R(RSI)); AND(64, R(long_prod), R(tmp));
SetJumpTarget(_ret); SetJumpTarget(_ret);
//return prod; //return prod;
gpr.putXReg(tmp);
#endif #endif
} }
@ -456,23 +464,23 @@ void DSPEmitter::get_long_prod_round_prodl(X64Reg long_prod)
void DSPEmitter::set_long_prod() void DSPEmitter::set_long_prod()
{ {
#ifdef _M_X64 #ifdef _M_X64
OpArg reg;
gpr.getReg(DSP_REG_PROD_64, reg, false);
X64Reg tmp; X64Reg tmp;
gpr.getFreeXReg(tmp); gpr.getFreeXReg(tmp);
MOV(64, R(tmp), Imm64(0x000000ffffffffffULL)); MOV(64, R(tmp), Imm64(0x000000ffffffffffULL));
AND(64, R(RAX), R(tmp)); AND(64, R(RAX), R(tmp));
// g_dsp.r[DSP_REG_PRODL] = (u16)val;
MOV(64, reg, R(RAX));
gpr.putXReg(tmp); gpr.putXReg(tmp);
OpArg prod_reg;
gpr.getReg(DSP_REG_PROD_64, prod_reg, false);
// g_dsp.r[DSP_REG_PRODL] = (u16)val;
MOV(64, prod_reg, R(RAX));
gpr.putReg(DSP_REG_PROD_64, true); gpr.putReg(DSP_REG_PROD_64, true);
#endif #endif
} }
// Returns s64 in RAX // Returns s64 in RAX
// Clobbers RSI // Clobbers RCX
void DSPEmitter::round_long_acc(X64Reg long_acc) void DSPEmitter::round_long_acc(X64Reg long_acc)
{ {
#ifdef _M_X64 #ifdef _M_X64
@ -480,14 +488,14 @@ void DSPEmitter::round_long_acc(X64Reg long_acc)
TEST(32, R(long_acc), Imm32(0x10000)); TEST(32, R(long_acc), Imm32(0x10000));
FixupBranch jump = J_CC(CC_Z); FixupBranch jump = J_CC(CC_Z);
ADD(64, R(long_acc), Imm32(0x8000)); ADD(64, R(long_acc), Imm32(0x8000));
MOV(64, R(ESI), Imm64(~0xffff)); MOV(64, R(ECX), Imm64(~0xffff));
AND(64, R(long_acc), R(RSI)); AND(64, R(long_acc), R(RCX));
FixupBranch _ret = J(); FixupBranch _ret = J();
//else prod = (prod + 0x7fff) & ~0xffff; //else prod = (prod + 0x7fff) & ~0xffff;
SetJumpTarget(jump); SetJumpTarget(jump);
ADD(64, R(long_acc), Imm32(0x7fff)); ADD(64, R(long_acc), Imm32(0x7fff));
MOV(64, R(RSI), Imm64(~0xffff)); MOV(64, R(RCX), Imm64(~0xffff));
AND(64, R(long_acc), R(RSI)); AND(64, R(long_acc), R(RCX));
SetJumpTarget(_ret); SetJumpTarget(_ret);
//return prod; //return prod;
#endif #endif
@ -577,15 +585,5 @@ void DSPEmitter::get_ax_h(int _reg, X64Reg axh)
gpr.readReg(_reg+DSP_REG_AXH0, axh, SIGN); gpr.readReg(_reg+DSP_REG_AXH0, axh, SIGN);
} }
void DSPEmitter::LoadDSPRegs()
{
// Load DSP register state here...
gpr.loadStaticRegs();
}
void DSPEmitter::SaveDSPRegs()
{
// Save DSP register state here...
gpr.saveStaticRegs();
}