Merge pull request #11139 from JosJuice/jit64-nans-no-freg
Jit64: Don't use fregsIn in HandleNaNs
This commit is contained in:
commit
22bcf134bf
|
@ -126,7 +126,8 @@ public:
|
||||||
void FinalizeSingleResult(Gen::X64Reg output, const Gen::OpArg& input, bool packed = true,
|
void FinalizeSingleResult(Gen::X64Reg output, const Gen::OpArg& input, bool packed = true,
|
||||||
bool duplicate = false);
|
bool duplicate = false);
|
||||||
void FinalizeDoubleResult(Gen::X64Reg output, const Gen::OpArg& input);
|
void FinalizeDoubleResult(Gen::X64Reg output, const Gen::OpArg& input);
|
||||||
void HandleNaNs(UGeckoInstruction inst, Gen::X64Reg xmm, Gen::X64Reg clobber);
|
void HandleNaNs(UGeckoInstruction inst, Gen::X64Reg xmm, Gen::X64Reg clobber,
|
||||||
|
std::vector<int> inputs);
|
||||||
|
|
||||||
void MultiplyImmediate(u32 imm, int a, int d, bool overflow);
|
void MultiplyImmediate(u32 imm, int a, int d, bool overflow);
|
||||||
|
|
||||||
|
|
|
@ -92,7 +92,7 @@ void Jit64::FinalizeDoubleResult(X64Reg output, const OpArg& input)
|
||||||
SetFPRFIfNeeded(input, false);
|
SetFPRFIfNeeded(input, false);
|
||||||
}
|
}
|
||||||
|
|
||||||
void Jit64::HandleNaNs(UGeckoInstruction inst, X64Reg xmm, X64Reg clobber)
|
void Jit64::HandleNaNs(UGeckoInstruction inst, X64Reg xmm, X64Reg clobber, std::vector<int> inputs)
|
||||||
{
|
{
|
||||||
// | PowerPC | x86
|
// | PowerPC | x86
|
||||||
// ---------------------+----------+---------
|
// ---------------------+----------+---------
|
||||||
|
@ -107,14 +107,13 @@ void Jit64::HandleNaNs(UGeckoInstruction inst, X64Reg xmm, X64Reg clobber)
|
||||||
|
|
||||||
ASSERT(xmm != clobber);
|
ASSERT(xmm != clobber);
|
||||||
|
|
||||||
std::vector<u32> inputs;
|
// Remove duplicates from inputs
|
||||||
u32 a = inst.FA, b = inst.FB, c = inst.FC;
|
for (auto it = inputs.begin(); it != inputs.end();)
|
||||||
for (u32 i : {a, b, c})
|
|
||||||
{
|
{
|
||||||
if (!js.op->fregsIn[i])
|
if (std::find(inputs.begin(), it, *it) != it)
|
||||||
continue;
|
it = inputs.erase(it);
|
||||||
if (std::find(inputs.begin(), inputs.end(), i) == inputs.end())
|
else
|
||||||
inputs.push_back(i);
|
++it;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (inst.OPCD != 4)
|
if (inst.OPCD != 4)
|
||||||
|
@ -128,7 +127,7 @@ void Jit64::HandleNaNs(UGeckoInstruction inst, X64Reg xmm, X64Reg clobber)
|
||||||
|
|
||||||
// If any inputs are NaNs, pick the first NaN of them
|
// If any inputs are NaNs, pick the first NaN of them
|
||||||
std::vector<FixupBranch> fixups;
|
std::vector<FixupBranch> fixups;
|
||||||
for (u32 x : inputs)
|
for (int x : inputs)
|
||||||
{
|
{
|
||||||
RCOpArg Rx = fpr.Use(x, RCMode::Read);
|
RCOpArg Rx = fpr.Use(x, RCMode::Read);
|
||||||
RegCache::Realize(Rx);
|
RegCache::Realize(Rx);
|
||||||
|
@ -168,7 +167,7 @@ void Jit64::HandleNaNs(UGeckoInstruction inst, X64Reg xmm, X64Reg clobber)
|
||||||
BLENDVPD(xmm, MConst(psGeneratedQNaN));
|
BLENDVPD(xmm, MConst(psGeneratedQNaN));
|
||||||
|
|
||||||
// If any inputs are NaNs, use those instead
|
// If any inputs are NaNs, use those instead
|
||||||
for (u32 x : inputs)
|
for (int x : inputs)
|
||||||
{
|
{
|
||||||
RCOpArg Rx = fpr.Use(x, RCMode::Read);
|
RCOpArg Rx = fpr.Use(x, RCMode::Read);
|
||||||
RegCache::Realize(Rx);
|
RegCache::Realize(Rx);
|
||||||
|
@ -198,7 +197,7 @@ void Jit64::HandleNaNs(UGeckoInstruction inst, X64Reg xmm, X64Reg clobber)
|
||||||
MOVAPD(xmm, tmp);
|
MOVAPD(xmm, tmp);
|
||||||
|
|
||||||
// If any inputs are NaNs, use those instead
|
// If any inputs are NaNs, use those instead
|
||||||
for (u32 x : inputs)
|
for (int x : inputs)
|
||||||
{
|
{
|
||||||
RCOpArg Rx = fpr.Use(x, RCMode::Read);
|
RCOpArg Rx = fpr.Use(x, RCMode::Read);
|
||||||
RegCache::Realize(Rx);
|
RegCache::Realize(Rx);
|
||||||
|
@ -277,7 +276,7 @@ void Jit64::fp_arith(UGeckoInstruction inst)
|
||||||
avx_op(avxOp, sseOp, dest, Rop1, Rop2, packed, reversible);
|
avx_op(avxOp, sseOp, dest, Rop1, Rop2, packed, reversible);
|
||||||
}
|
}
|
||||||
|
|
||||||
HandleNaNs(inst, dest, XMM0);
|
HandleNaNs(inst, dest, XMM0, {op1, op2});
|
||||||
if (single)
|
if (single)
|
||||||
FinalizeSingleResult(Rd, R(dest), packed, true);
|
FinalizeSingleResult(Rd, R(dest), packed, true);
|
||||||
else
|
else
|
||||||
|
@ -500,7 +499,7 @@ void Jit64::fmaddXX(UGeckoInstruction inst)
|
||||||
result_xmm = Rd;
|
result_xmm = Rd;
|
||||||
}
|
}
|
||||||
|
|
||||||
HandleNaNs(inst, result_xmm, XMM0);
|
HandleNaNs(inst, result_xmm, XMM0, {a, b, c});
|
||||||
|
|
||||||
if (single)
|
if (single)
|
||||||
FinalizeSingleResult(Rd, R(result_xmm), packed, true);
|
FinalizeSingleResult(Rd, R(result_xmm), packed, true);
|
||||||
|
|
|
@ -77,7 +77,7 @@ void Jit64::ps_sum(UGeckoInstruction inst)
|
||||||
default:
|
default:
|
||||||
PanicAlertFmt("ps_sum WTF!!!");
|
PanicAlertFmt("ps_sum WTF!!!");
|
||||||
}
|
}
|
||||||
HandleNaNs(inst, tmp, tmp == XMM1 ? XMM0 : XMM1);
|
HandleNaNs(inst, tmp, tmp == XMM1 ? XMM0 : XMM1, {a, b, c});
|
||||||
FinalizeSingleResult(Rd, R(tmp));
|
FinalizeSingleResult(Rd, R(tmp));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -112,7 +112,7 @@ void Jit64::ps_muls(UGeckoInstruction inst)
|
||||||
if (round_input)
|
if (round_input)
|
||||||
Force25BitPrecision(XMM1, R(XMM1), XMM0);
|
Force25BitPrecision(XMM1, R(XMM1), XMM0);
|
||||||
MULPD(XMM1, Ra);
|
MULPD(XMM1, Ra);
|
||||||
HandleNaNs(inst, XMM1, XMM0);
|
HandleNaNs(inst, XMM1, XMM0, {a, c});
|
||||||
FinalizeSingleResult(Rd, R(XMM1));
|
FinalizeSingleResult(Rd, R(XMM1));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue