// Copyright (c) 2012- PPSSPP Project. // This program is free software: you can redistribute it and/or modify // it under the terms of the GNU General Public License as published by // the Free Software Foundation, version 2.0 or later versions. // This program is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU General Public License 2.0 for more details. // A copy of the GPL 2.0 should have been included with the program. // If not, see http://www.gnu.org/licenses/ // Official git repository and contact information can be found at // https://github.com/hrydgard/ppsspp and http://www.ppsspp.org/. #include "../MIPS.h" #include "../../Config.h" #include "Common/Common.h" #include "Jit.h" #include "RegCache.h" #define _RS ((op>>21) & 0x1F) #define _RT ((op>>16) & 0x1F) #define _RD ((op>>11) & 0x1F) #define _FS ((op>>11) & 0x1F) #define _FT ((op>>16) & 0x1F) #define _FD ((op>>6 ) & 0x1F) #define _POS ((op>>6 ) & 0x1F) #define _SIZE ((op>>11 ) & 0x1F) // All functions should have CONDITIONAL_DISABLE, so we can narrow things down to a file quickly. // Currently known non working ones should have DISABLE. // #define CONDITIONAL_DISABLE { Comp_Generic(op); return; } #define CONDITIONAL_DISABLE ; #define DISABLE { Comp_Generic(op); return; } namespace MIPSComp { void Jit::CompFPTriArith(u32 op, void (XEmitter::*arith)(X64Reg reg, OpArg), bool orderMatters) { int ft = _FT; int fs = _FS; int fd = _FD; fpr.SpillLock(fd, fs, ft); if (fs == fd) { fpr.BindToRegister(fd, true, true); (this->*arith)(fpr.RX(fd), fpr.R(ft)); } else if (ft == fd && !orderMatters) { fpr.BindToRegister(fd, true, true); (this->*arith)(fpr.RX(fd), fpr.R(fs)); } else if (ft != fd && fs != fd && ft != fs) { fpr.BindToRegister(fd, false, true); MOVSS(fpr.RX(fd), fpr.R(fs)); (this->*arith)(fpr.RX(fd), fpr.R(ft)); } else { fpr.BindToRegister(fd, true, true); MOVSS(XMM0, fpr.R(fs)); (this->*arith)(XMM0, fpr.R(ft)); MOVSS(fpr.RX(fd), R(XMM0)); } fpr.ReleaseSpillLocks(); } void Jit::Comp_FPU3op(u32 op) { CONDITIONAL_DISABLE; switch (op & 0x3f) { case 0: CompFPTriArith(op, &XEmitter::ADDSS, false); break; //F(fd) = F(fs) + F(ft); //add case 1: CompFPTriArith(op, &XEmitter::SUBSS, true); break; //F(fd) = F(fs) - F(ft); //sub case 2: CompFPTriArith(op, &XEmitter::MULSS, false); break; //F(fd) = F(fs) * F(ft); //mul case 3: CompFPTriArith(op, &XEmitter::DIVSS, true); break; //F(fd) = F(fs) / F(ft); //div default: _dbg_assert_msg_(CPU,0,"Trying to compile FPU3Op instruction that can't be interpreted"); break; } } static u32 GC_ALIGNED16(ssLoadStoreTemp); void Jit::Comp_FPULS(u32 op) { CONDITIONAL_DISABLE; s32 offset = (s16)(op&0xFFFF); int ft = _FT; int rs = _RS; switch(op >> 26) { case 49: //FI(ft) = Memory::Read_U32(addr); break; //lwc1 { gpr.Lock(rs); fpr.SpillLock(ft); fpr.BindToRegister(ft, false, true); JitSafeMem safe(this, rs, offset); OpArg src; if (safe.PrepareRead(src, 4)) MOVSS(fpr.RX(ft), src); if (safe.PrepareSlowRead((void *) &Memory::Read_U32)) { MOV(32, M((void *)&ssLoadStoreTemp), R(EAX)); MOVSS(fpr.RX(ft), M((void *)&ssLoadStoreTemp)); } safe.Finish(); gpr.UnlockAll(); fpr.ReleaseSpillLocks(); } break; case 57: //Memory::Write_U32(FI(ft), addr); break; //swc1 { gpr.Lock(rs); fpr.SpillLock(ft); fpr.BindToRegister(ft, true, false); JitSafeMem safe(this, rs, offset); OpArg dest; if (safe.PrepareWrite(dest, 4)) MOVSS(dest, fpr.RX(ft)); if (safe.PrepareSlowWrite()) { MOVSS(M((void *)&ssLoadStoreTemp), fpr.RX(ft)); safe.DoSlowWrite((void *) &Memory::Write_U32, M((void *)&ssLoadStoreTemp)); } safe.Finish(); gpr.UnlockAll(); fpr.ReleaseSpillLocks(); } break; default: _dbg_assert_msg_(CPU,0,"Trying to interpret FPULS instruction that can't be interpreted"); break; } } static const u64 GC_ALIGNED16(ssOneBits[2]) = {0x0000000100000001ULL, 0x0000000100000001ULL}; static const u64 GC_ALIGNED16(ssSignBits2[2]) = {0x8000000080000000ULL, 0x8000000080000000ULL}; static const u64 GC_ALIGNED16(ssNoSignMask[2]) = {0x7FFFFFFF7FFFFFFFULL, 0x7FFFFFFF7FFFFFFFULL}; static u32 ssCompareTemp; enum { CMPEQSS = 0, CMPLTSS = 1, CMPLESS = 2, CMPUNORDSS = 3, CMPNEQSS = 4, CMPNLTSS = 5, CMPNLESS = 6, CMPORDSS = 7, }; void Jit::CompFPComp(int lhs, int rhs, u8 compare, bool allowNaN) { MOVSS(XMM0, fpr.R(lhs)); CMPSS(XMM0, fpr.R(rhs), compare); MOVSS(M((void *) ¤tMIPS->fpcond), XMM0); // This means that NaN also means true, e.g. !<> or !>, etc. if (allowNaN) { MOVSS(XMM0, fpr.R(lhs)); CMPSS(XMM0, fpr.R(rhs), CMPUNORDSS); MOVSS(M((void *) &ssCompareTemp), XMM0); MOV(32, R(EAX), M((void *) &ssCompareTemp)); OR(32, M((void *) ¤tMIPS->fpcond), R(EAX)); } } void Jit::Comp_FPUComp(u32 op) { CONDITIONAL_DISABLE; int fs = _FS; int ft = _FT; switch (op & 0xf) { case 0: //f case 8: //sf MOV(32, M((void *) ¤tMIPS->fpcond), Imm32(0)); break; case 1: //un case 9: //ngle CompFPComp(fs, ft, CMPUNORDSS); break; case 2: //eq case 10: //seq CompFPComp(fs, ft, CMPEQSS); break; case 3: //ueq case 11: //ngl CompFPComp(fs, ft, CMPEQSS, true); break; case 4: //olt case 12: //lt CompFPComp(fs, ft, CMPLTSS); break; case 5: //ult case 13: //nge CompFPComp(ft, fs, CMPNLESS); break; case 6: //ole case 14: //le CompFPComp(fs, ft, CMPLESS); break; case 7: //ule case 15: //ngt CompFPComp(ft, fs, CMPNLTSS); break; default: DISABLE; } } void Jit::Comp_FPU2op(u32 op) { CONDITIONAL_DISABLE; int fs = _FS; int fd = _FD; switch (op & 0x3f) { case 5: //F(fd) = fabsf(F(fs)); break; //abs fpr.SpillLock(fd, fs); fpr.BindToRegister(fd, fd == fs, true); MOVSS(fpr.RX(fd), fpr.R(fs)); PAND(fpr.RX(fd), M((void *)ssNoSignMask)); fpr.ReleaseSpillLocks(); break; case 6: //F(fd) = F(fs); break; //mov if (fd != fs) { fpr.SpillLock(fd, fs); fpr.BindToRegister(fd, fd == fs, true); MOVSS(fpr.RX(fd), fpr.R(fs)); fpr.ReleaseSpillLocks(); } break; case 7: //F(fd) = -F(fs); break; //neg fpr.SpillLock(fd, fs); fpr.BindToRegister(fd, fd == fs, true); MOVSS(fpr.RX(fd), fpr.R(fs)); PXOR(fpr.RX(fd), M((void *)ssSignBits2)); fpr.ReleaseSpillLocks(); break; case 4: //F(fd) = sqrtf(F(fs)); break; //sqrt fpr.SpillLock(fd, fs); // this probably works, just badly tested fpr.BindToRegister(fd, fd == fs, true); SQRTSS(fpr.RX(fd), fpr.R(fs)); fpr.ReleaseSpillLocks(); return; case 13: //FsI(fd) = F(fs)>=0 ? (int)floorf(F(fs)) : (int)ceilf(F(fs)); break;//trunc.w.s fpr.SpillLock(fs, fd); fpr.StoreFromRegister(fd); CVTTSS2SI(EAX, fpr.R(fs)); MOV(32, fpr.R(fd), R(EAX)); fpr.ReleaseSpillLocks(); break; case 32: //F(fd) = (float)FsI(fs); break; //cvt.s.w fpr.StoreFromRegister(fs); CVTSI2SS(XMM0, fpr.R(fs)); MOVSS(fpr.R(fd), XMM0); break; case 12: //FsI(fd) = (int)floorf(F(fs)+0.5f); break; //round.w.s case 14: //FsI(fd) = (int)ceilf (F(fs)); break; //ceil.w.s case 15: //FsI(fd) = (int)floorf(F(fs)); break; //floor.w.s case 36: //FsI(fd) = (int) F(fs); break; //cvt.w.s default: Comp_Generic(op); return; } } void Jit::Comp_mxc1(u32 op) { CONDITIONAL_DISABLE; int fs = _FS; int rt = _RT; switch((op >> 21) & 0x1f) { case 0: // R(rt) = FI(fs); break; //mfc1 if (rt != 0) { // Cross move! slightly tricky fpr.StoreFromRegister(fs); gpr.Lock(rt); gpr.BindToRegister(rt, false, true); MOV(32, gpr.R(rt), fpr.R(fs)); gpr.UnlockAll(); } return; case 2: // R(rt) = currentMIPS->ReadFCR(fs); break; //cfc1 Comp_Generic(op); return; case 4: //FI(fs) = R(rt); break; //mtc1 // Cross move! slightly tricky gpr.StoreFromRegister(rt); fpr.SpillLock(fs); fpr.BindToRegister(fs, false, true); MOVSS(fpr.RX(fs), gpr.R(rt)); fpr.ReleaseSpillLocks(); return; case 6: //currentMIPS->WriteFCR(fs, R(rt)); break; //ctc1 Comp_Generic(op); return; } } } // namespace MIPSComp