crXXX: Avoid loading twice when CRBA == CRBB

This commit is contained in:
MerryMage 2018-12-21 11:19:03 +00:00
parent 07c146e7e2
commit 174d2b0230
1 changed files with 31 additions and 14 deletions

View File

@ -552,23 +552,40 @@ void Jit64::crXXX(UGeckoInstruction inst)
JITDISABLE(bJITSystemRegistersOff); JITDISABLE(bJITSystemRegistersOff);
DEBUG_ASSERT_MSG(DYNA_REC, inst.OPCD == 19, "Invalid crXXX"); DEBUG_ASSERT_MSG(DYNA_REC, inst.OPCD == 19, "Invalid crXXX");
// Special case: crclr // TODO(merry): Futher optimizations can be performed here. For example,
if (inst.CRBA == inst.CRBB && inst.SUBOP10 == 193) // instead of extracting each CR field bit then setting it, the operation
// could be performed on the internal format directly instead and the
// relevant bit result can be masked out.
if (inst.CRBA == inst.CRBB)
{ {
switch (inst.SUBOP10)
{
// crclr
case 129: // crandc: A && ~B => 0
case 193: // crxor: A ^ B => 0
ClearCRFieldBit(inst.CRBD >> 2, 3 - (inst.CRBD & 3)); ClearCRFieldBit(inst.CRBD >> 2, 3 - (inst.CRBD & 3));
return; return;
}
// Special case: crset // crset
if (inst.CRBA == inst.CRBB && inst.SUBOP10 == 289) case 289: // creqv: ~(A ^ B) => 1
{ case 417: // crorc: A || ~B => 1
SetCRFieldBit(inst.CRBD >> 2, 3 - (inst.CRBD & 3)); SetCRFieldBit(inst.CRBD >> 2, 3 - (inst.CRBD & 3));
return; return;
}
// TODO(delroth): Potential optimizations could be applied here. For case 257: // crand: A && B => A
// instance, if the two CR bits being loaded are the same, two loads are case 449: // cror: A || B => A
// not required. GetCRFieldBit(inst.CRBA >> 2, 3 - (inst.CRBA & 3), RSCRATCH, false);
SetCRFieldBit(inst.CRBD >> 2, 3 - (inst.CRBD & 3), RSCRATCH);
return;
case 33: // crnor: ~(A || B) => ~A
case 225: // crnand: ~(A && B) => ~A
GetCRFieldBit(inst.CRBA >> 2, 3 - (inst.CRBA & 3), RSCRATCH, true);
SetCRFieldBit(inst.CRBD >> 2, 3 - (inst.CRBD & 3), RSCRATCH);
return;
}
}
// creqv or crnand or crnor // creqv or crnand or crnor
bool negateA = inst.SUBOP10 == 289 || inst.SUBOP10 == 225 || inst.SUBOP10 == 33; bool negateA = inst.SUBOP10 == 289 || inst.SUBOP10 == 225 || inst.SUBOP10 == 33;