A little bit more WIP JIT work.

git-svn-id: https://dolphin-emu.googlecode.com/svn/trunk@1809 8ced0084-cf51-0410-be5f-012b33b47a6e
This commit is contained in:
magumagu9 2009-01-06 08:39:32 +00:00
parent f95937bc2e
commit e4f8419be4
3 changed files with 67 additions and 32 deletions

View File

@ -1063,6 +1063,8 @@ static void DoWriteCode(IRBuilder* ibuild, Jit64* Jit, bool UseProfile) {
case ExpandPackedToMReg: case ExpandPackedToMReg:
case CompactMRegToPacked: case CompactMRegToPacked:
case FPNeg: case FPNeg:
case FPDup0:
case FPDup1:
case FSNeg: case FSNeg:
case FDNeg: case FDNeg:
if (thisUsed) if (thisUsed)
@ -1604,6 +1606,24 @@ static void DoWriteCode(IRBuilder* ibuild, Jit64* Jit, bool UseProfile) {
fregNormalRegClear(RI, I); fregNormalRegClear(RI, I);
break; break;
} }
case FPDup0: {
if (!thisUsed) break;
X64Reg reg = fregFindFreeReg(RI);
Jit->MOVAPD(reg, fregLocForInst(RI, getOp1(I)));
Jit->PUNPCKLDQ(reg, R(reg));
RI.fregs[reg] = I;
fregNormalRegClear(RI, I);
break;
}
case FPDup1: {
if (!thisUsed) break;
X64Reg reg = fregFindFreeReg(RI);
Jit->MOVAPD(reg, fregLocForInst(RI, getOp1(I)));
Jit->SHUFPS(reg, R(reg), 0xE5);
RI.fregs[reg] = I;
fregNormalRegClear(RI, I);
break;
}
case LoadFReg: { case LoadFReg: {
if (!thisUsed) break; if (!thisUsed) break;
X64Reg reg = fregFindFreeReg(RI); X64Reg reg = fregFindFreeReg(RI);

View File

@ -171,6 +171,8 @@ namespace IREmitter {
FPMerge01, FPMerge01,
FPMerge10, FPMerge10,
FPMerge11, FPMerge11,
FPDup0,
FPDup1,
FResult_End, FResult_End,
StorePaired, StorePaired,
StoreSingle, StoreSingle,
@ -463,6 +465,12 @@ namespace IREmitter {
InstLoc EmitFPMerge11(InstLoc op1, InstLoc op2) { InstLoc EmitFPMerge11(InstLoc op1, InstLoc op2) {
return FoldBiOp(FPMerge11, op1, op2); return FoldBiOp(FPMerge11, op1, op2);
} }
InstLoc EmitFPDup0(InstLoc op1) {
return FoldUOp(FPDup0, op1);
}
InstLoc EmitFPDup1(InstLoc op1) {
return FoldUOp(FPDup1, op1);
}
InstLoc EmitFPNeg(InstLoc op1) { InstLoc EmitFPNeg(InstLoc op1) {
return FoldUOp(FPNeg, op1); return FoldUOp(FPNeg, op1);
} }

View File

@ -230,40 +230,23 @@
void Jit64::ps_muls(UGeckoInstruction inst) void Jit64::ps_muls(UGeckoInstruction inst)
{ {
if(Core::g_CoreStartupParameter.bJITOff || Core::g_CoreStartupParameter.bJITPairedOff)
{Default(inst); return;} // turn off from debugger
INSTRUCTION_START;
if (inst.Rc) { if (inst.Rc) {
Default(inst); return; Default(inst); return;
} }
int d = inst.FD; IREmitter::InstLoc val = ibuild.EmitLoadFReg(inst.FA),
int a = inst.FA; rhs = ibuild.EmitLoadFReg(inst.FC);
int c = inst.FC;
fpr.Lock(a, c, d); val = ibuild.EmitCompactMRegToPacked(val);
fpr.LoadToX64(d, d == a || d == c, true); rhs = ibuild.EmitCompactMRegToPacked(rhs);
switch (inst.SUBOP5)
{ if (inst.SUBOP5 == 12)
case 12: rhs = ibuild.EmitFPDup0(rhs);
// Single multiply scalar high else
// TODO - faster version for when regs are different rhs = ibuild.EmitFPDup1(rhs);
MOVAPD(XMM0, fpr.R(a));
MOVDDUP(XMM1, fpr.R(c)); val = ibuild.EmitFPMul(val, rhs);
MULPD(XMM0, R(XMM1)); val = ibuild.EmitExpandPackedToMReg(val);
MOVAPD(fpr.R(d), XMM0); ibuild.EmitStoreFReg(val, inst.FD);
break;
case 13:
// TODO - faster version for when regs are different
MOVAPD(XMM0, fpr.R(a));
MOVAPD(XMM1, fpr.R(c));
SHUFPD(XMM1, R(XMM1), 3); // copy higher to lower
MULPD(XMM0, R(XMM1));
MOVAPD(fpr.R(d), XMM0);
break;
default:
PanicAlert("ps_muls WTF!!!");
}
ForceSinglePrecisionP(fpr.RX(d));
fpr.UnlockAll();
} }
@ -301,7 +284,7 @@
void Jit64::ps_maddXX(UGeckoInstruction inst) void Jit64::ps_maddXX(UGeckoInstruction inst)
{ {
if (inst.Rc || (inst.SUBOP5 != 28 && inst.SUBOP5 != 29 && inst.SUBOP5 != 30)) { if (inst.Rc) {
Default(inst); return; Default(inst); return;
} }
@ -309,6 +292,22 @@
val = ibuild.EmitCompactMRegToPacked(val); val = ibuild.EmitCompactMRegToPacked(val);
switch (inst.SUBOP5) switch (inst.SUBOP5)
{ {
case 14: {//madds0
op2 = ibuild.EmitCompactMRegToPacked(ibuild.EmitLoadFReg(inst.FC));
op2 = ibuild.EmitFPDup0(op2);
val = ibuild.EmitFPMul(val, op2);
op3 = ibuild.EmitCompactMRegToPacked(ibuild.EmitLoadFReg(inst.FB));
val = ibuild.EmitFPAdd(val, op3);
break;
}
case 15: {//madds1
op2 = ibuild.EmitCompactMRegToPacked(ibuild.EmitLoadFReg(inst.FC));
op2 = ibuild.EmitFPDup1(op2);
val = ibuild.EmitFPMul(val, op2);
op3 = ibuild.EmitCompactMRegToPacked(ibuild.EmitLoadFReg(inst.FB));
val = ibuild.EmitFPAdd(val, op3);
break;
}
case 28: {//msub case 28: {//msub
op2 = ibuild.EmitCompactMRegToPacked(ibuild.EmitLoadFReg(inst.FC)); op2 = ibuild.EmitCompactMRegToPacked(ibuild.EmitLoadFReg(inst.FC));
val = ibuild.EmitFPMul(val, op2); val = ibuild.EmitFPMul(val, op2);
@ -331,6 +330,14 @@
val = ibuild.EmitFPNeg(val); val = ibuild.EmitFPNeg(val);
break; break;
} }
case 31: {//nmadd
op2 = ibuild.EmitCompactMRegToPacked(ibuild.EmitLoadFReg(inst.FC));
val = ibuild.EmitFPMul(val, op2);
op3 = ibuild.EmitCompactMRegToPacked(ibuild.EmitLoadFReg(inst.FB));
val = ibuild.EmitFPAdd(val, op3);
val = ibuild.EmitFPNeg(val);
break;
}
} }
val = ibuild.EmitExpandPackedToMReg(val); val = ibuild.EmitExpandPackedToMReg(val);
ibuild.EmitStoreFReg(val, inst.FD); ibuild.EmitStoreFReg(val, inst.FD);