mirror of
https://github.com/dolphin-emu/dolphin.git
synced 2025-01-24 15:01:16 +01:00
Merge pull request #12868 from Sintendo/scoped-reg
JitArm64: Release temporary regs with RAII
This commit is contained in:
commit
c212c0d08e
@ -262,12 +262,11 @@ void JitArm64::FallBackToInterpreter(UGeckoInstruction inst)
|
|||||||
if (js.op->canEndBlock)
|
if (js.op->canEndBlock)
|
||||||
{
|
{
|
||||||
// also flush the program counter
|
// also flush the program counter
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
MOVI2R(WA, js.compilerPC);
|
MOVI2R(WA, js.compilerPC);
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(pc));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(pc));
|
||||||
ADD(WA, WA, 4);
|
ADD(WA, WA, 4);
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(npc));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(npc));
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
Interpreter::Instruction instr = Interpreter::GetInterpreterOp(inst);
|
Interpreter::Instruction instr = Interpreter::GetInterpreterOp(inst);
|
||||||
@ -283,24 +282,23 @@ void JitArm64::FallBackToInterpreter(UGeckoInstruction inst)
|
|||||||
{
|
{
|
||||||
if (js.isLastInstruction)
|
if (js.isLastInstruction)
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(npc));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(npc));
|
||||||
WriteExceptionExit(WA);
|
WriteExceptionExit(WA);
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
// only exit if ppcstate.npc was changed
|
// only exit if ppcstate.npc was changed
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(npc));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(npc));
|
||||||
ARM64Reg WB = gpr.GetReg();
|
{
|
||||||
|
auto WB = gpr.GetScopedReg();
|
||||||
MOVI2R(WB, js.compilerPC + 4);
|
MOVI2R(WB, js.compilerPC + 4);
|
||||||
CMP(WB, WA);
|
CMP(WB, WA);
|
||||||
gpr.Unlock(WB);
|
}
|
||||||
FixupBranch c = B(CC_EQ);
|
FixupBranch c = B(CC_EQ);
|
||||||
WriteExceptionExit(WA);
|
WriteExceptionExit(WA);
|
||||||
SetJumpTarget(c);
|
SetJumpTarget(c);
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else if (ShouldHandleFPExceptionForInstruction(js.op))
|
else if (ShouldHandleFPExceptionForInstruction(js.op))
|
||||||
@ -399,11 +397,12 @@ void JitArm64::IntializeSpeculativeConstants()
|
|||||||
SwitchToNearCode();
|
SwitchToNearCode();
|
||||||
}
|
}
|
||||||
|
|
||||||
ARM64Reg tmp = gpr.GetReg();
|
{
|
||||||
|
auto tmp = gpr.GetScopedReg();
|
||||||
ARM64Reg value = gpr.R(i);
|
ARM64Reg value = gpr.R(i);
|
||||||
MOVI2R(tmp, compile_time_value);
|
MOVI2R(tmp, compile_time_value);
|
||||||
CMP(value, tmp);
|
CMP(value, tmp);
|
||||||
gpr.Unlock(tmp);
|
}
|
||||||
|
|
||||||
FixupBranch no_fail = B(CCFlags::CC_EQ);
|
FixupBranch no_fail = B(CCFlags::CC_EQ);
|
||||||
B(fail);
|
B(fail);
|
||||||
@ -442,16 +441,15 @@ void JitArm64::MSRUpdated(u32 msr)
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
MOVI2R(WA, feature_flags);
|
MOVI2R(WA, feature_flags);
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(feature_flags));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(feature_flags));
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::MSRUpdated(ARM64Reg msr)
|
void JitArm64::MSRUpdated(ARM64Reg msr)
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg XA = EncodeRegTo64(WA);
|
ARM64Reg XA = EncodeRegTo64(WA);
|
||||||
|
|
||||||
// Update mem_ptr
|
// Update mem_ptr
|
||||||
@ -472,8 +470,6 @@ void JitArm64::MSRUpdated(ARM64Reg msr)
|
|||||||
if (other_feature_flags != 0)
|
if (other_feature_flags != 0)
|
||||||
ORR(WA, WA, LogicalImm(other_feature_flags, GPRSize::B32));
|
ORR(WA, WA, LogicalImm(other_feature_flags, GPRSize::B32));
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(feature_flags));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(feature_flags));
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::WriteExit(u32 destination, bool LK, u32 exit_address_after_return,
|
void JitArm64::WriteExit(u32 destination, bool LK, u32 exit_address_after_return,
|
||||||
@ -671,13 +667,16 @@ void JitArm64::FakeLKExit(u32 exit_address_after_return, ARM64Reg exit_address_a
|
|||||||
// function has been called!
|
// function has been called!
|
||||||
gpr.Lock(ARM64Reg::W30);
|
gpr.Lock(ARM64Reg::W30);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
const u8* host_address_after_return;
|
||||||
|
{
|
||||||
// Push {ARM_PC (64-bit); PPC_PC (32-bit); feature_flags (32-bit)} on the stack
|
// Push {ARM_PC (64-bit); PPC_PC (32-bit); feature_flags (32-bit)} on the stack
|
||||||
ARM64Reg after_reg = ARM64Reg::INVALID_REG;
|
Arm64RegCache::ScopedARM64Reg after_reg;
|
||||||
ARM64Reg reg_to_push;
|
ARM64Reg reg_to_push;
|
||||||
const u64 feature_flags = m_ppc_state.feature_flags;
|
const u64 feature_flags = m_ppc_state.feature_flags;
|
||||||
if (exit_address_after_return_reg == ARM64Reg::INVALID_REG)
|
if (exit_address_after_return_reg == ARM64Reg::INVALID_REG)
|
||||||
{
|
{
|
||||||
after_reg = gpr.GetReg();
|
after_reg = gpr.GetScopedReg();
|
||||||
reg_to_push = EncodeRegTo64(after_reg);
|
reg_to_push = EncodeRegTo64(after_reg);
|
||||||
MOVI2R(reg_to_push, feature_flags << 32 | exit_address_after_return);
|
MOVI2R(reg_to_push, feature_flags << 32 | exit_address_after_return);
|
||||||
}
|
}
|
||||||
@ -687,19 +686,18 @@ void JitArm64::FakeLKExit(u32 exit_address_after_return, ARM64Reg exit_address_a
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
after_reg = gpr.GetReg();
|
after_reg = gpr.GetScopedReg();
|
||||||
reg_to_push = EncodeRegTo64(after_reg);
|
reg_to_push = EncodeRegTo64(after_reg);
|
||||||
ORRI2R(reg_to_push, EncodeRegTo64(exit_address_after_return_reg), feature_flags << 32,
|
ORRI2R(reg_to_push, EncodeRegTo64(exit_address_after_return_reg), feature_flags << 32,
|
||||||
reg_to_push);
|
reg_to_push);
|
||||||
}
|
}
|
||||||
ARM64Reg code_reg = gpr.GetReg();
|
|
||||||
|
auto code_reg = gpr.GetScopedReg();
|
||||||
constexpr s32 adr_offset = sizeof(u32) * 3;
|
constexpr s32 adr_offset = sizeof(u32) * 3;
|
||||||
const u8* host_address_after_return = GetCodePtr() + adr_offset;
|
host_address_after_return = GetCodePtr() + adr_offset;
|
||||||
ADR(EncodeRegTo64(code_reg), adr_offset);
|
ADR(EncodeRegTo64(code_reg), adr_offset);
|
||||||
STP(IndexType::Pre, EncodeRegTo64(code_reg), reg_to_push, ARM64Reg::SP, -16);
|
STP(IndexType::Pre, EncodeRegTo64(code_reg), reg_to_push, ARM64Reg::SP, -16);
|
||||||
gpr.Unlock(code_reg);
|
}
|
||||||
if (after_reg != ARM64Reg::INVALID_REG)
|
|
||||||
gpr.Unlock(after_reg);
|
|
||||||
|
|
||||||
FixupBranch skip_exit = BL();
|
FixupBranch skip_exit = BL();
|
||||||
DEBUG_ASSERT(GetCodePtr() == host_address_after_return || HasWriteFailed());
|
DEBUG_ASSERT(GetCodePtr() == host_address_after_return || HasWriteFailed());
|
||||||
@ -832,10 +830,9 @@ void JitArm64::WriteExceptionExit(ARM64Reg dest, bool only_external, bool always
|
|||||||
|
|
||||||
void JitArm64::WriteConditionalExceptionExit(int exception, u64 increment_sp_on_exit)
|
void JitArm64::WriteConditionalExceptionExit(int exception, u64 increment_sp_on_exit)
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
WriteConditionalExceptionExit(exception, WA, Arm64Gen::ARM64Reg::INVALID_REG,
|
WriteConditionalExceptionExit(exception, WA, Arm64Gen::ARM64Reg::INVALID_REG,
|
||||||
increment_sp_on_exit);
|
increment_sp_on_exit);
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::WriteConditionalExceptionExit(int exception, ARM64Reg temp_gpr, ARM64Reg temp_fpr,
|
void JitArm64::WriteConditionalExceptionExit(int exception, ARM64Reg temp_gpr, ARM64Reg temp_fpr,
|
||||||
@ -1227,7 +1224,7 @@ bool JitArm64::DoJit(u32 em_address, JitBlock* b, u32 nextPC)
|
|||||||
// asynchronous.
|
// asynchronous.
|
||||||
if (jo.optimizeGatherPipe && gatherPipeIntCheck)
|
if (jo.optimizeGatherPipe && gatherPipeIntCheck)
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg XA = EncodeRegTo64(WA);
|
ARM64Reg XA = EncodeRegTo64(WA);
|
||||||
|
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(Exceptions));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(Exceptions));
|
||||||
@ -1253,8 +1250,6 @@ bool JitArm64::DoJit(u32 em_address, JitBlock* b, u32 nextPC)
|
|||||||
SwitchToNearCode();
|
SwitchToNearCode();
|
||||||
SetJumpTarget(no_ext_exception);
|
SetJumpTarget(no_ext_exception);
|
||||||
SetJumpTarget(exit);
|
SetJumpTarget(exit);
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -1268,12 +1263,11 @@ bool JitArm64::DoJit(u32 em_address, JitBlock* b, u32 nextPC)
|
|||||||
// The only thing that currently sets op.skip is the BLR following optimization.
|
// The only thing that currently sets op.skip is the BLR following optimization.
|
||||||
// If any non-branch instruction starts setting that too, this will need to be changed.
|
// If any non-branch instruction starts setting that too, this will need to be changed.
|
||||||
ASSERT(op.inst.hex == 0x4e800020);
|
ASSERT(op.inst.hex == 0x4e800020);
|
||||||
const ARM64Reg bw_reg_a = gpr.GetReg(), bw_reg_b = gpr.GetReg();
|
const auto bw_reg_a = gpr.GetScopedReg(), bw_reg_b = gpr.GetScopedReg();
|
||||||
const BitSet32 gpr_caller_save =
|
const BitSet32 gpr_caller_save =
|
||||||
gpr.GetCallerSavedUsed() & ~BitSet32{DecodeReg(bw_reg_a), DecodeReg(bw_reg_b)};
|
gpr.GetCallerSavedUsed() & ~BitSet32{DecodeReg(bw_reg_a), DecodeReg(bw_reg_b)};
|
||||||
WriteBranchWatch<true>(op.address, op.branchTo, op.inst, bw_reg_a, bw_reg_b,
|
WriteBranchWatch<true>(op.address, op.branchTo, op.inst, bw_reg_a, bw_reg_b,
|
||||||
gpr_caller_save, fpr.GetCallerSavedUsed());
|
gpr_caller_save, fpr.GetCallerSavedUsed());
|
||||||
gpr.Unlock(bw_reg_a, bw_reg_b);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
@ -1311,10 +1305,12 @@ bool JitArm64::DoJit(u32 em_address, JitBlock* b, u32 nextPC)
|
|||||||
|
|
||||||
if ((opinfo->flags & FL_USE_FPU) && !js.firstFPInstructionFound)
|
if ((opinfo->flags & FL_USE_FPU) && !js.firstFPInstructionFound)
|
||||||
{
|
{
|
||||||
|
FixupBranch b1;
|
||||||
// This instruction uses FPU - needs to add FP exception bailout
|
// This instruction uses FPU - needs to add FP exception bailout
|
||||||
ARM64Reg WA = gpr.GetReg();
|
{
|
||||||
|
auto WA = gpr.GetScopedReg();
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(msr));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(msr));
|
||||||
FixupBranch b1 = TBNZ(WA, 13); // Test FP enabled bit
|
b1 = TBNZ(WA, 13); // Test FP enabled bit
|
||||||
|
|
||||||
FixupBranch far_addr = B();
|
FixupBranch far_addr = B();
|
||||||
SwitchToFarCode();
|
SwitchToFarCode();
|
||||||
@ -1326,8 +1322,7 @@ bool JitArm64::DoJit(u32 em_address, JitBlock* b, u32 nextPC)
|
|||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(Exceptions));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(Exceptions));
|
||||||
ORR(WA, WA, LogicalImm(EXCEPTION_FPU_UNAVAILABLE, GPRSize::B32));
|
ORR(WA, WA, LogicalImm(EXCEPTION_FPU_UNAVAILABLE, GPRSize::B32));
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(Exceptions));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(Exceptions));
|
||||||
|
}
|
||||||
gpr.Unlock(WA);
|
|
||||||
|
|
||||||
WriteExceptionExit(js.compilerPC, false, true);
|
WriteExceptionExit(js.compilerPC, false, true);
|
||||||
|
|
||||||
|
@ -24,13 +24,12 @@ void JitArm64::sc(UGeckoInstruction inst)
|
|||||||
gpr.Flush(FlushMode::All, ARM64Reg::INVALID_REG);
|
gpr.Flush(FlushMode::All, ARM64Reg::INVALID_REG);
|
||||||
fpr.Flush(FlushMode::All, ARM64Reg::INVALID_REG);
|
fpr.Flush(FlushMode::All, ARM64Reg::INVALID_REG);
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
{
|
||||||
|
auto WA = gpr.GetScopedReg();
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(Exceptions));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(Exceptions));
|
||||||
ORR(WA, WA, LogicalImm(EXCEPTION_SYSCALL, GPRSize::B32));
|
ORR(WA, WA, LogicalImm(EXCEPTION_SYSCALL, GPRSize::B32));
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(Exceptions));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(Exceptions));
|
||||||
|
}
|
||||||
gpr.Unlock(WA);
|
|
||||||
|
|
||||||
WriteExceptionExit(js.compilerPC + 4, false, true);
|
WriteExceptionExit(js.compilerPC + 4, false, true);
|
||||||
}
|
}
|
||||||
@ -51,9 +50,10 @@ void JitArm64::rfi(UGeckoInstruction inst)
|
|||||||
// R1 = MSR contents
|
// R1 = MSR contents
|
||||||
// R2 = Mask
|
// R2 = Mask
|
||||||
// R3 = Mask
|
// R3 = Mask
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg WB = gpr.GetReg();
|
{
|
||||||
ARM64Reg WC = gpr.GetReg();
|
auto WB = gpr.GetScopedReg();
|
||||||
|
auto WC = gpr.GetScopedReg();
|
||||||
|
|
||||||
LDR(IndexType::Unsigned, WC, PPC_REG, PPCSTATE_OFF(msr));
|
LDR(IndexType::Unsigned, WC, PPC_REG, PPCSTATE_OFF(msr));
|
||||||
|
|
||||||
@ -65,14 +65,13 @@ void JitArm64::rfi(UGeckoInstruction inst)
|
|||||||
ORR(WA, WA, WC); // rB = Masked MSR OR masked SRR1
|
ORR(WA, WA, WC); // rB = Masked MSR OR masked SRR1
|
||||||
|
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(msr)); // STR rB in to rA
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(msr)); // STR rB in to rA
|
||||||
gpr.Unlock(WB, WC);
|
}
|
||||||
|
|
||||||
MSRUpdated(WA);
|
MSRUpdated(WA);
|
||||||
|
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF_SPR(SPR_SRR0));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF_SPR(SPR_SRR0));
|
||||||
|
|
||||||
WriteExceptionExit(WA);
|
WriteExceptionExit(WA);
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
template <bool condition>
|
template <bool condition>
|
||||||
@ -144,10 +143,10 @@ void JitArm64::bx(UGeckoInstruction inst)
|
|||||||
INSTRUCTION_START
|
INSTRUCTION_START
|
||||||
JITDISABLE(bJITBranchOff);
|
JITDISABLE(bJITBranchOff);
|
||||||
|
|
||||||
ARM64Reg WA = ARM64Reg::INVALID_REG;
|
Arm64GPRCache::ScopedARM64Reg WA = ARM64Reg::INVALID_REG;
|
||||||
if (inst.LK)
|
if (inst.LK)
|
||||||
{
|
{
|
||||||
WA = gpr.GetReg();
|
WA = gpr.GetScopedReg();
|
||||||
MOVI2R(WA, js.compilerPC + 4);
|
MOVI2R(WA, js.compilerPC + 4);
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF_SPR(SPR_LR));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF_SPR(SPR_LR));
|
||||||
}
|
}
|
||||||
@ -156,13 +155,12 @@ void JitArm64::bx(UGeckoInstruction inst)
|
|||||||
{
|
{
|
||||||
if (IsDebuggingEnabled())
|
if (IsDebuggingEnabled())
|
||||||
{
|
{
|
||||||
const ARM64Reg WB = gpr.GetReg(), WC = gpr.GetReg();
|
const auto WB = gpr.GetScopedReg(), WC = gpr.GetScopedReg();
|
||||||
BitSet32 gpr_caller_save = gpr.GetCallerSavedUsed() & ~BitSet32{DecodeReg(WB), DecodeReg(WC)};
|
BitSet32 gpr_caller_save = gpr.GetCallerSavedUsed() & ~BitSet32{DecodeReg(WB), DecodeReg(WC)};
|
||||||
if (WA != ARM64Reg::INVALID_REG && js.op->skipLRStack)
|
if (WA != ARM64Reg::INVALID_REG && js.op->skipLRStack)
|
||||||
gpr_caller_save[DecodeReg(WA)] = false;
|
gpr_caller_save[DecodeReg(WA)] = false;
|
||||||
WriteBranchWatch<true>(js.compilerPC, js.op->branchTo, inst, WB, WC, gpr_caller_save,
|
WriteBranchWatch<true>(js.compilerPC, js.op->branchTo, inst, WB, WC, gpr_caller_save,
|
||||||
fpr.GetCallerSavedUsed());
|
fpr.GetCallerSavedUsed());
|
||||||
gpr.Unlock(WB, WC);
|
|
||||||
}
|
}
|
||||||
if (inst.LK && !js.op->skipLRStack)
|
if (inst.LK && !js.op->skipLRStack)
|
||||||
{
|
{
|
||||||
@ -172,9 +170,6 @@ void JitArm64::bx(UGeckoInstruction inst)
|
|||||||
FakeLKExit(js.compilerPC + 4, WA);
|
FakeLKExit(js.compilerPC + 4, WA);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (WA != ARM64Reg::INVALID_REG)
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
|
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -184,13 +179,12 @@ void JitArm64::bx(UGeckoInstruction inst)
|
|||||||
if (js.op->branchIsIdleLoop)
|
if (js.op->branchIsIdleLoop)
|
||||||
{
|
{
|
||||||
if (WA == ARM64Reg::INVALID_REG)
|
if (WA == ARM64Reg::INVALID_REG)
|
||||||
WA = gpr.GetReg();
|
WA = gpr.GetScopedReg();
|
||||||
|
|
||||||
if (IsDebuggingEnabled())
|
if (IsDebuggingEnabled())
|
||||||
{
|
{
|
||||||
const ARM64Reg WB = gpr.GetReg();
|
const auto WB = gpr.GetScopedReg();
|
||||||
WriteBranchWatch<true>(js.compilerPC, js.op->branchTo, inst, WA, WB, {}, {});
|
WriteBranchWatch<true>(js.compilerPC, js.op->branchTo, inst, WA, WB, {}, {});
|
||||||
gpr.Unlock(WB);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
// make idle loops go faster
|
// make idle loops go faster
|
||||||
@ -198,7 +192,7 @@ void JitArm64::bx(UGeckoInstruction inst)
|
|||||||
|
|
||||||
MOVP2R(XA, &CoreTiming::GlobalIdle);
|
MOVP2R(XA, &CoreTiming::GlobalIdle);
|
||||||
BLR(XA);
|
BLR(XA);
|
||||||
gpr.Unlock(WA);
|
WA.Unlock();
|
||||||
|
|
||||||
WriteExceptionExit(js.op->branchTo);
|
WriteExceptionExit(js.op->branchTo);
|
||||||
return;
|
return;
|
||||||
@ -206,16 +200,12 @@ void JitArm64::bx(UGeckoInstruction inst)
|
|||||||
|
|
||||||
if (IsDebuggingEnabled())
|
if (IsDebuggingEnabled())
|
||||||
{
|
{
|
||||||
const ARM64Reg WB = gpr.GetReg(), WC = gpr.GetReg();
|
const auto WB = gpr.GetScopedReg(), WC = gpr.GetScopedReg();
|
||||||
const BitSet32 gpr_caller_save =
|
const BitSet32 gpr_caller_save =
|
||||||
WA != ARM64Reg::INVALID_REG ? BitSet32{DecodeReg(WA)} & CALLER_SAVED_GPRS : BitSet32{};
|
WA != ARM64Reg::INVALID_REG ? BitSet32{DecodeReg(WA)} & CALLER_SAVED_GPRS : BitSet32{};
|
||||||
WriteBranchWatch<true>(js.compilerPC, js.op->branchTo, inst, WB, WC, gpr_caller_save, {});
|
WriteBranchWatch<true>(js.compilerPC, js.op->branchTo, inst, WB, WC, gpr_caller_save, {});
|
||||||
gpr.Unlock(WB, WC);
|
|
||||||
}
|
}
|
||||||
WriteExit(js.op->branchTo, inst.LK, js.compilerPC + 4, WA);
|
WriteExit(js.op->branchTo, inst.LK, js.compilerPC + 4, WA);
|
||||||
|
|
||||||
if (WA != ARM64Reg::INVALID_REG)
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::bcx(UGeckoInstruction inst)
|
void JitArm64::bcx(UGeckoInstruction inst)
|
||||||
@ -223,10 +213,14 @@ void JitArm64::bcx(UGeckoInstruction inst)
|
|||||||
INSTRUCTION_START
|
INSTRUCTION_START
|
||||||
JITDISABLE(bJITBranchOff);
|
JITDISABLE(bJITBranchOff);
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg WB = inst.LK || IsDebuggingEnabled() ? gpr.GetReg() : WA;
|
auto WB = inst.LK || IsDebuggingEnabled() ? gpr.GetScopedReg() :
|
||||||
ARM64Reg WC = IsDebuggingEnabled() && inst.LK && !js.op->branchIsIdleLoop ? gpr.GetReg() :
|
Arm64GPRCache::ScopedARM64Reg(WA.GetReg());
|
||||||
ARM64Reg::INVALID_REG;
|
|
||||||
|
{
|
||||||
|
auto WC = IsDebuggingEnabled() && inst.LK && !js.op->branchIsIdleLoop ?
|
||||||
|
gpr.GetScopedReg() :
|
||||||
|
Arm64GPRCache::ScopedARM64Reg(ARM64Reg::INVALID_REG);
|
||||||
|
|
||||||
FixupBranch pCTRDontBranch;
|
FixupBranch pCTRDontBranch;
|
||||||
if ((inst.BO & BO_DONT_DECREMENT_FLAG) == 0) // Decrement and test CTR
|
if ((inst.BO & BO_DONT_DECREMENT_FLAG) == 0) // Decrement and test CTR
|
||||||
@ -290,9 +284,7 @@ void JitArm64::bcx(UGeckoInstruction inst)
|
|||||||
SetJumpTarget(pConditionDontBranch);
|
SetJumpTarget(pConditionDontBranch);
|
||||||
if ((inst.BO & BO_DONT_DECREMENT_FLAG) == 0)
|
if ((inst.BO & BO_DONT_DECREMENT_FLAG) == 0)
|
||||||
SetJumpTarget(pCTRDontBranch);
|
SetJumpTarget(pCTRDontBranch);
|
||||||
|
}
|
||||||
if (WC != ARM64Reg::INVALID_REG)
|
|
||||||
gpr.Unlock(WC);
|
|
||||||
|
|
||||||
if (!analyzer.HasOption(PPCAnalyst::PPCAnalyzer::OPTION_CONDITIONAL_CONTINUE))
|
if (!analyzer.HasOption(PPCAnalyst::PPCAnalyzer::OPTION_CONDITIONAL_CONTINUE))
|
||||||
{
|
{
|
||||||
@ -311,10 +303,6 @@ void JitArm64::bcx(UGeckoInstruction inst)
|
|||||||
WriteBranchWatch<false>(js.compilerPC, js.compilerPC + 4, inst, WA, WB, gpr_caller_save,
|
WriteBranchWatch<false>(js.compilerPC, js.compilerPC + 4, inst, WA, WB, gpr_caller_save,
|
||||||
fpr.GetCallerSavedUsed());
|
fpr.GetCallerSavedUsed());
|
||||||
}
|
}
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
if (WB != WA)
|
|
||||||
gpr.Unlock(WB);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::bcctrx(UGeckoInstruction inst)
|
void JitArm64::bcctrx(UGeckoInstruction inst)
|
||||||
@ -337,34 +325,29 @@ void JitArm64::bcctrx(UGeckoInstruction inst)
|
|||||||
gpr.Flush(FlushMode::All, ARM64Reg::INVALID_REG);
|
gpr.Flush(FlushMode::All, ARM64Reg::INVALID_REG);
|
||||||
fpr.Flush(FlushMode::All, ARM64Reg::INVALID_REG);
|
fpr.Flush(FlushMode::All, ARM64Reg::INVALID_REG);
|
||||||
|
|
||||||
ARM64Reg WB = ARM64Reg::INVALID_REG;
|
Arm64GPRCache::ScopedARM64Reg WB = ARM64Reg::INVALID_REG;
|
||||||
if (inst.LK_3)
|
if (inst.LK_3)
|
||||||
{
|
{
|
||||||
WB = gpr.GetReg();
|
WB = gpr.GetScopedReg();
|
||||||
MOVI2R(WB, js.compilerPC + 4);
|
MOVI2R(WB, js.compilerPC + 4);
|
||||||
STR(IndexType::Unsigned, WB, PPC_REG, PPCSTATE_OFF_SPR(SPR_LR));
|
STR(IndexType::Unsigned, WB, PPC_REG, PPCSTATE_OFF_SPR(SPR_LR));
|
||||||
}
|
}
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
|
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF_SPR(SPR_CTR));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF_SPR(SPR_CTR));
|
||||||
AND(WA, WA, LogicalImm(~0x3, GPRSize::B32));
|
AND(WA, WA, LogicalImm(~0x3, GPRSize::B32));
|
||||||
|
|
||||||
if (IsDebuggingEnabled())
|
if (IsDebuggingEnabled())
|
||||||
{
|
{
|
||||||
const ARM64Reg WC = gpr.GetReg(), WD = gpr.GetReg();
|
const auto WC = gpr.GetScopedReg(), WD = gpr.GetScopedReg();
|
||||||
BitSet32 gpr_caller_save = BitSet32{DecodeReg(WA)};
|
BitSet32 gpr_caller_save = BitSet32{DecodeReg(WA)};
|
||||||
if (WB != ARM64Reg::INVALID_REG)
|
if (WB != ARM64Reg::INVALID_REG)
|
||||||
gpr_caller_save[DecodeReg(WB)] = true;
|
gpr_caller_save[DecodeReg(WB)] = true;
|
||||||
gpr_caller_save &= CALLER_SAVED_GPRS;
|
gpr_caller_save &= CALLER_SAVED_GPRS;
|
||||||
WriteBranchWatchDestInRegister(js.compilerPC, WA, inst, WC, WD, gpr_caller_save, {});
|
WriteBranchWatchDestInRegister(js.compilerPC, WA, inst, WC, WD, gpr_caller_save, {});
|
||||||
gpr.Unlock(WC, WD);
|
|
||||||
}
|
}
|
||||||
WriteExit(WA, inst.LK_3, js.compilerPC + 4, WB);
|
WriteExit(WA, inst.LK_3, js.compilerPC + 4, WB);
|
||||||
|
|
||||||
if (WB != ARM64Reg::INVALID_REG)
|
|
||||||
gpr.Unlock(WB);
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::bclrx(UGeckoInstruction inst)
|
void JitArm64::bclrx(UGeckoInstruction inst)
|
||||||
@ -375,10 +358,19 @@ void JitArm64::bclrx(UGeckoInstruction inst)
|
|||||||
bool conditional =
|
bool conditional =
|
||||||
(inst.BO & BO_DONT_DECREMENT_FLAG) == 0 || (inst.BO & BO_DONT_CHECK_CONDITION) == 0;
|
(inst.BO & BO_DONT_DECREMENT_FLAG) == 0 || (inst.BO & BO_DONT_CHECK_CONDITION) == 0;
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg WB =
|
Arm64GPRCache::ScopedARM64Reg WB;
|
||||||
conditional || inst.LK || IsDebuggingEnabled() ? gpr.GetReg() : ARM64Reg::INVALID_REG;
|
if (conditional || inst.LK || IsDebuggingEnabled())
|
||||||
ARM64Reg WC = IsDebuggingEnabled() ? gpr.GetReg() : ARM64Reg::INVALID_REG;
|
{
|
||||||
|
WB = gpr.GetScopedReg();
|
||||||
|
}
|
||||||
|
|
||||||
|
{
|
||||||
|
Arm64GPRCache::ScopedARM64Reg WC;
|
||||||
|
if (IsDebuggingEnabled())
|
||||||
|
{
|
||||||
|
WC = gpr.GetScopedReg();
|
||||||
|
}
|
||||||
|
|
||||||
FixupBranch pCTRDontBranch;
|
FixupBranch pCTRDontBranch;
|
||||||
if ((inst.BO & BO_DONT_DECREMENT_FLAG) == 0) // Decrement and test CTR
|
if ((inst.BO & BO_DONT_DECREMENT_FLAG) == 0) // Decrement and test CTR
|
||||||
@ -451,9 +443,7 @@ void JitArm64::bclrx(UGeckoInstruction inst)
|
|||||||
SetJumpTarget(pConditionDontBranch);
|
SetJumpTarget(pConditionDontBranch);
|
||||||
if ((inst.BO & BO_DONT_DECREMENT_FLAG) == 0)
|
if ((inst.BO & BO_DONT_DECREMENT_FLAG) == 0)
|
||||||
SetJumpTarget(pCTRDontBranch);
|
SetJumpTarget(pCTRDontBranch);
|
||||||
|
}
|
||||||
if (WC != ARM64Reg::INVALID_REG)
|
|
||||||
gpr.Unlock(WC);
|
|
||||||
|
|
||||||
if (!analyzer.HasOption(PPCAnalyst::PPCAnalyzer::OPTION_CONDITIONAL_CONTINUE))
|
if (!analyzer.HasOption(PPCAnalyst::PPCAnalyzer::OPTION_CONDITIONAL_CONTINUE))
|
||||||
{
|
{
|
||||||
@ -472,8 +462,4 @@ void JitArm64::bclrx(UGeckoInstruction inst)
|
|||||||
WriteBranchWatch<false>(js.compilerPC, js.compilerPC + 4, inst, WA, WB, gpr_caller_save,
|
WriteBranchWatch<false>(js.compilerPC, js.compilerPC + 4, inst, WA, WB, gpr_caller_save,
|
||||||
fpr.GetCallerSavedUsed());
|
fpr.GetCallerSavedUsed());
|
||||||
}
|
}
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
if (WB != ARM64Reg::INVALID_REG)
|
|
||||||
gpr.Unlock(WB);
|
|
||||||
}
|
}
|
||||||
|
@ -102,15 +102,16 @@ void JitArm64::fp_arith(UGeckoInstruction inst)
|
|||||||
const ARM64Reg VC = use_c ? reg_encoder(fpr.R(c, type)) : ARM64Reg::INVALID_REG;
|
const ARM64Reg VC = use_c ? reg_encoder(fpr.R(c, type)) : ARM64Reg::INVALID_REG;
|
||||||
const ARM64Reg VD = reg_encoder(fpr.RW(d, type_out));
|
const ARM64Reg VD = reg_encoder(fpr.RW(d, type_out));
|
||||||
|
|
||||||
ARM64Reg V0Q = ARM64Reg::INVALID_REG;
|
{
|
||||||
ARM64Reg V1Q = ARM64Reg::INVALID_REG;
|
Arm64FPRCache::ScopedARM64Reg V0Q = ARM64Reg::INVALID_REG;
|
||||||
|
Arm64FPRCache::ScopedARM64Reg V1Q = ARM64Reg::INVALID_REG;
|
||||||
|
|
||||||
ARM64Reg rounded_c_reg = VC;
|
ARM64Reg rounded_c_reg = VC;
|
||||||
if (round_c)
|
if (round_c)
|
||||||
{
|
{
|
||||||
ASSERT_MSG(DYNA_REC, !inputs_are_singles, "Tried to apply 25-bit precision to single");
|
ASSERT_MSG(DYNA_REC, !inputs_are_singles, "Tried to apply 25-bit precision to single");
|
||||||
|
|
||||||
V0Q = fpr.GetReg();
|
V0Q = fpr.GetScopedReg();
|
||||||
rounded_c_reg = reg_encoder(V0Q);
|
rounded_c_reg = reg_encoder(V0Q);
|
||||||
Force25BitPrecision(rounded_c_reg, VC);
|
Force25BitPrecision(rounded_c_reg, VC);
|
||||||
}
|
}
|
||||||
@ -119,7 +120,7 @@ void JitArm64::fp_arith(UGeckoInstruction inst)
|
|||||||
if (fma && inaccurate_fma && VD == VB)
|
if (fma && inaccurate_fma && VD == VB)
|
||||||
{
|
{
|
||||||
if (V0Q == ARM64Reg::INVALID_REG)
|
if (V0Q == ARM64Reg::INVALID_REG)
|
||||||
V0Q = fpr.GetReg();
|
V0Q = fpr.GetScopedReg();
|
||||||
inaccurate_fma_reg = reg_encoder(V0Q);
|
inaccurate_fma_reg = reg_encoder(V0Q);
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -128,7 +129,7 @@ void JitArm64::fp_arith(UGeckoInstruction inst)
|
|||||||
m_accurate_nans && (VD == VA || (use_b && VD == VB) || (use_c && VD == VC));
|
m_accurate_nans && (VD == VA || (use_b && VD == VB) || (use_c && VD == VC));
|
||||||
if (preserve_d)
|
if (preserve_d)
|
||||||
{
|
{
|
||||||
V1Q = fpr.GetReg();
|
V1Q = fpr.GetScopedReg();
|
||||||
result_reg = reg_encoder(V1Q);
|
result_reg = reg_encoder(V1Q);
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -244,11 +245,7 @@ void JitArm64::fp_arith(UGeckoInstruction inst)
|
|||||||
|
|
||||||
for (FixupBranch fixup : nan_fixups)
|
for (FixupBranch fixup : nan_fixups)
|
||||||
SetJumpTarget(fixup);
|
SetJumpTarget(fixup);
|
||||||
|
}
|
||||||
if (V0Q != ARM64Reg::INVALID_REG)
|
|
||||||
fpr.Unlock(V0Q);
|
|
||||||
if (V1Q != ARM64Reg::INVALID_REG)
|
|
||||||
fpr.Unlock(V1Q);
|
|
||||||
|
|
||||||
if (output_is_single)
|
if (output_is_single)
|
||||||
{
|
{
|
||||||
@ -449,19 +446,20 @@ void JitArm64::FloatCompare(UGeckoInstruction inst, bool upper)
|
|||||||
gpr.BindCRToRegister(crf, false);
|
gpr.BindCRToRegister(crf, false);
|
||||||
const ARM64Reg XA = gpr.CR(crf);
|
const ARM64Reg XA = gpr.CR(crf);
|
||||||
|
|
||||||
ARM64Reg fpscr_reg = ARM64Reg::INVALID_REG;
|
Arm64GPRCache::ScopedARM64Reg fpscr_reg = ARM64Reg::INVALID_REG;
|
||||||
if (fprf)
|
if (fprf)
|
||||||
{
|
{
|
||||||
fpscr_reg = gpr.GetReg();
|
fpscr_reg = gpr.GetScopedReg();
|
||||||
LDR(IndexType::Unsigned, fpscr_reg, PPC_REG, PPCSTATE_OFF(fpscr));
|
LDR(IndexType::Unsigned, fpscr_reg, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
AND(fpscr_reg, fpscr_reg, LogicalImm(~FPCC_MASK, GPRSize::B32));
|
AND(fpscr_reg, fpscr_reg, LogicalImm(~FPCC_MASK, GPRSize::B32));
|
||||||
}
|
}
|
||||||
|
|
||||||
ARM64Reg V0Q = ARM64Reg::INVALID_REG;
|
{
|
||||||
ARM64Reg V1Q = ARM64Reg::INVALID_REG;
|
Arm64FPRCache::ScopedARM64Reg V0Q;
|
||||||
|
Arm64FPRCache::ScopedARM64Reg V1Q;
|
||||||
if (upper_a)
|
if (upper_a)
|
||||||
{
|
{
|
||||||
V0Q = fpr.GetReg();
|
V0Q = fpr.GetScopedReg();
|
||||||
m_float_emit.DUP(singles ? 32 : 64, paired_reg_encoder(V0Q), paired_reg_encoder(VA), 1);
|
m_float_emit.DUP(singles ? 32 : 64, paired_reg_encoder(V0Q), paired_reg_encoder(VA), 1);
|
||||||
VA = reg_encoder(V0Q);
|
VA = reg_encoder(V0Q);
|
||||||
}
|
}
|
||||||
@ -473,18 +471,14 @@ void JitArm64::FloatCompare(UGeckoInstruction inst, bool upper)
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
V1Q = fpr.GetReg();
|
V1Q = fpr.GetScopedReg();
|
||||||
m_float_emit.DUP(singles ? 32 : 64, paired_reg_encoder(V1Q), paired_reg_encoder(VB), 1);
|
m_float_emit.DUP(singles ? 32 : 64, paired_reg_encoder(V1Q), paired_reg_encoder(VB), 1);
|
||||||
VB = reg_encoder(V1Q);
|
VB = reg_encoder(V1Q);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
m_float_emit.FCMP(VA, VB);
|
m_float_emit.FCMP(VA, VB);
|
||||||
|
}
|
||||||
if (V0Q != ARM64Reg::INVALID_REG)
|
|
||||||
fpr.Unlock(V0Q);
|
|
||||||
if (V1Q != ARM64Reg::INVALID_REG)
|
|
||||||
fpr.Unlock(V1Q);
|
|
||||||
|
|
||||||
FixupBranch pNaN, pLesser, pGreater;
|
FixupBranch pNaN, pLesser, pGreater;
|
||||||
FixupBranch continue1, continue2, continue3;
|
FixupBranch continue1, continue2, continue3;
|
||||||
@ -538,7 +532,6 @@ void JitArm64::FloatCompare(UGeckoInstruction inst, bool upper)
|
|||||||
if (fprf)
|
if (fprf)
|
||||||
{
|
{
|
||||||
STR(IndexType::Unsigned, fpscr_reg, PPC_REG, PPCSTATE_OFF(fpscr));
|
STR(IndexType::Unsigned, fpscr_reg, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
gpr.Unlock(fpscr_reg);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -572,7 +565,7 @@ void JitArm64::fctiwx(UGeckoInstruction inst)
|
|||||||
|
|
||||||
if (single)
|
if (single)
|
||||||
{
|
{
|
||||||
const ARM64Reg V0 = fpr.GetReg();
|
const auto V0 = fpr.GetScopedReg();
|
||||||
|
|
||||||
if (is_fctiwzx)
|
if (is_fctiwzx)
|
||||||
{
|
{
|
||||||
@ -589,12 +582,10 @@ void JitArm64::fctiwx(UGeckoInstruction inst)
|
|||||||
m_float_emit.BIC(16, EncodeRegToDouble(V0), 0x7);
|
m_float_emit.BIC(16, EncodeRegToDouble(V0), 0x7);
|
||||||
|
|
||||||
m_float_emit.ORR(EncodeRegToDouble(VD), EncodeRegToDouble(VD), EncodeRegToDouble(V0));
|
m_float_emit.ORR(EncodeRegToDouble(VD), EncodeRegToDouble(VD), EncodeRegToDouble(V0));
|
||||||
|
|
||||||
fpr.Unlock(V0);
|
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
const ARM64Reg WA = gpr.GetReg();
|
const auto WA = gpr.GetScopedReg();
|
||||||
|
|
||||||
if (is_fctiwzx)
|
if (is_fctiwzx)
|
||||||
{
|
{
|
||||||
@ -608,8 +599,6 @@ void JitArm64::fctiwx(UGeckoInstruction inst)
|
|||||||
|
|
||||||
ORR(EncodeRegTo64(WA), EncodeRegTo64(WA), LogicalImm(0xFFF8'0000'0000'0000ULL, GPRSize::B64));
|
ORR(EncodeRegTo64(WA), EncodeRegTo64(WA), LogicalImm(0xFFF8'0000'0000'0000ULL, GPRSize::B64));
|
||||||
m_float_emit.FMOV(EncodeRegToDouble(VD), EncodeRegTo64(WA));
|
m_float_emit.FMOV(EncodeRegToDouble(VD), EncodeRegTo64(WA));
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
ASSERT_MSG(DYNA_REC, b == d || single == fpr.IsSingle(b, true),
|
ASSERT_MSG(DYNA_REC, b == d || single == fpr.IsSingle(b, true),
|
||||||
|
@ -86,10 +86,9 @@ void JitArm64::LoadCarry()
|
|||||||
{
|
{
|
||||||
case CarryFlag::InPPCState:
|
case CarryFlag::InPPCState:
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
||||||
CMP(WA, 1);
|
CMP(WA, 1);
|
||||||
gpr.Unlock(WA);
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case CarryFlag::InHostCarry:
|
case CarryFlag::InHostCarry:
|
||||||
@ -119,18 +118,16 @@ void JitArm64::FlushCarry()
|
|||||||
}
|
}
|
||||||
case CarryFlag::InHostCarry:
|
case CarryFlag::InHostCarry:
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
CSET(WA, CC_CS);
|
CSET(WA, CC_CS);
|
||||||
STRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
STRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
||||||
gpr.Unlock(WA);
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case CarryFlag::ConstantTrue:
|
case CarryFlag::ConstantTrue:
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
MOVI2R(WA, 1);
|
MOVI2R(WA, 1);
|
||||||
STRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
STRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
||||||
gpr.Unlock(WA);
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case CarryFlag::ConstantFalse:
|
case CarryFlag::ConstantFalse:
|
||||||
@ -155,9 +152,10 @@ void JitArm64::reg_imm(u32 d, u32 a, u32 value, u32 (*do_op)(u32, u32),
|
|||||||
else
|
else
|
||||||
{
|
{
|
||||||
gpr.BindToRegister(d, d == a);
|
gpr.BindToRegister(d, d == a);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
{
|
||||||
|
auto WA = gpr.GetScopedReg();
|
||||||
(this->*op)(gpr.R(d), gpr.R(a), value, WA);
|
(this->*op)(gpr.R(d), gpr.R(a), value, WA);
|
||||||
gpr.Unlock(WA);
|
}
|
||||||
|
|
||||||
if (Rc)
|
if (Rc)
|
||||||
ComputeRC0(gpr.R(d));
|
ComputeRC0(gpr.R(d));
|
||||||
@ -245,9 +243,8 @@ void JitArm64::addix(UGeckoInstruction inst)
|
|||||||
{
|
{
|
||||||
gpr.BindToRegister(d, d == a);
|
gpr.BindToRegister(d, d == a);
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ADDI2R(gpr.R(d), gpr.R(a), imm, WA);
|
ADDI2R(gpr.R(d), gpr.R(a), imm, WA);
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
@ -544,9 +541,10 @@ void JitArm64::addx(UGeckoInstruction inst)
|
|||||||
int imm_value = gpr.GetImm(imm_reg);
|
int imm_value = gpr.GetImm(imm_reg);
|
||||||
|
|
||||||
gpr.BindToRegister(d, d == in_reg);
|
gpr.BindToRegister(d, d == in_reg);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
{
|
||||||
|
auto WA = gpr.GetScopedReg();
|
||||||
ADDI2R(gpr.R(d), gpr.R(in_reg), imm_value, WA);
|
ADDI2R(gpr.R(d), gpr.R(in_reg), imm_value, WA);
|
||||||
gpr.Unlock(WA);
|
}
|
||||||
if (inst.Rc)
|
if (inst.Rc)
|
||||||
ComputeRC0(gpr.R(d));
|
ComputeRC0(gpr.R(d));
|
||||||
}
|
}
|
||||||
@ -722,9 +720,8 @@ void JitArm64::cmpi(UGeckoInstruction inst)
|
|||||||
|
|
||||||
if (B != 0)
|
if (B != 0)
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
SUBI2R(CR, CR, B, EncodeRegTo64(WA));
|
SUBI2R(CR, CR, B, EncodeRegTo64(WA));
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -796,10 +793,9 @@ void JitArm64::rlwinmx_internal(UGeckoInstruction inst, u32 sh)
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
MOVI2R(WA, mask);
|
MOVI2R(WA, mask);
|
||||||
AND(gpr.R(a), WA, gpr.R(s), ArithOption(gpr.R(s), ShiftType::ROR, 32 - sh));
|
AND(gpr.R(a), WA, gpr.R(s), ArithOption(gpr.R(s), ShiftType::ROR, 32 - sh));
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (inst.Rc)
|
if (inst.Rc)
|
||||||
@ -829,11 +825,12 @@ void JitArm64::rlwnmx(UGeckoInstruction inst)
|
|||||||
const u32 mask = MakeRotationMask(inst.MB, inst.ME);
|
const u32 mask = MakeRotationMask(inst.MB, inst.ME);
|
||||||
|
|
||||||
gpr.BindToRegister(a, a == s || a == b);
|
gpr.BindToRegister(a, a == s || a == b);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
{
|
||||||
|
auto WA = gpr.GetScopedReg();
|
||||||
NEG(WA, gpr.R(b));
|
NEG(WA, gpr.R(b));
|
||||||
RORV(gpr.R(a), gpr.R(s), WA);
|
RORV(gpr.R(a), gpr.R(s), WA);
|
||||||
ANDI2R(gpr.R(a), gpr.R(a), mask, WA);
|
ANDI2R(gpr.R(a), gpr.R(a), mask, WA);
|
||||||
gpr.Unlock(WA);
|
}
|
||||||
|
|
||||||
if (inst.Rc)
|
if (inst.Rc)
|
||||||
ComputeRC0(gpr.R(a));
|
ComputeRC0(gpr.R(a));
|
||||||
@ -878,8 +875,8 @@ void JitArm64::srawix(UGeckoInstruction inst)
|
|||||||
|
|
||||||
if (js.op->wantsCA)
|
if (js.op->wantsCA)
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg dest = inplace_carry ? WA : ARM64Reg::WSP;
|
ARM64Reg dest = inplace_carry ? ARM64Reg(WA) : ARM64Reg::WSP;
|
||||||
if (a != s)
|
if (a != s)
|
||||||
{
|
{
|
||||||
ASR(RA, RS, amount);
|
ASR(RA, RS, amount);
|
||||||
@ -901,7 +898,6 @@ void JitArm64::srawix(UGeckoInstruction inst)
|
|||||||
CSINC(WA, ARM64Reg::WSP, ARM64Reg::WSP, CC_EQ);
|
CSINC(WA, ARM64Reg::WSP, ARM64Reg::WSP, CC_EQ);
|
||||||
ComputeCarry(WA);
|
ComputeCarry(WA);
|
||||||
}
|
}
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
@ -936,9 +932,10 @@ void JitArm64::addic(UGeckoInstruction inst)
|
|||||||
else
|
else
|
||||||
{
|
{
|
||||||
gpr.BindToRegister(d, d == a);
|
gpr.BindToRegister(d, d == a);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
{
|
||||||
|
auto WA = gpr.GetScopedReg();
|
||||||
CARRY_IF_NEEDED(ADDI2R, ADDSI2R, gpr.R(d), gpr.R(a), simm, WA);
|
CARRY_IF_NEEDED(ADDI2R, ADDSI2R, gpr.R(d), gpr.R(a), simm, WA);
|
||||||
gpr.Unlock(WA);
|
}
|
||||||
|
|
||||||
ComputeCarry();
|
ComputeCarry();
|
||||||
if (rc)
|
if (rc)
|
||||||
@ -1037,12 +1034,10 @@ void JitArm64::mulli(UGeckoInstruction inst)
|
|||||||
gpr.BindToRegister(d, allocate_reg);
|
gpr.BindToRegister(d, allocate_reg);
|
||||||
|
|
||||||
// Reuse d to hold the immediate if possible, allocate a register otherwise.
|
// Reuse d to hold the immediate if possible, allocate a register otherwise.
|
||||||
ARM64Reg WA = allocate_reg ? gpr.GetReg() : gpr.R(d);
|
auto WA = allocate_reg ? gpr.GetScopedReg() : Arm64GPRCache::ScopedARM64Reg(gpr.R(d));
|
||||||
|
|
||||||
MOVI2R(WA, (u32)(s32)inst.SIMM_16);
|
MOVI2R(WA, (u32)(s32)inst.SIMM_16);
|
||||||
MUL(gpr.R(d), gpr.R(a), WA);
|
MUL(gpr.R(d), gpr.R(a), WA);
|
||||||
if (allocate_reg)
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -1137,16 +1132,16 @@ void JitArm64::addzex(UGeckoInstruction inst)
|
|||||||
{
|
{
|
||||||
case CarryFlag::InPPCState:
|
case CarryFlag::InPPCState:
|
||||||
{
|
{
|
||||||
gpr.BindToRegister(d, d == a);
|
const bool allocate_reg = d == a;
|
||||||
ARM64Reg WA = d == a ? gpr.GetReg() : gpr.R(d);
|
gpr.BindToRegister(d, allocate_reg);
|
||||||
|
|
||||||
|
{
|
||||||
|
auto WA = allocate_reg ? gpr.GetScopedReg() : Arm64GPRCache::ScopedARM64Reg(gpr.R(d));
|
||||||
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
||||||
CARRY_IF_NEEDED(ADD, ADDS, gpr.R(d), gpr.R(a), WA);
|
CARRY_IF_NEEDED(ADD, ADDS, gpr.R(d), gpr.R(a), WA);
|
||||||
|
}
|
||||||
|
|
||||||
ComputeCarry();
|
ComputeCarry();
|
||||||
|
|
||||||
if (d == a)
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case CarryFlag::InHostCarry:
|
case CarryFlag::InHostCarry:
|
||||||
@ -1229,18 +1224,16 @@ void JitArm64::subfex(UGeckoInstruction inst)
|
|||||||
{
|
{
|
||||||
case CarryFlag::InPPCState:
|
case CarryFlag::InPPCState:
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
||||||
ADDI2R(gpr.R(d), WA, ~i + j, gpr.R(d));
|
ADDI2R(gpr.R(d), WA, ~i + j, gpr.R(d));
|
||||||
gpr.Unlock(WA);
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case CarryFlag::InHostCarry:
|
case CarryFlag::InHostCarry:
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
MOVI2R(WA, ~i + j);
|
MOVI2R(WA, ~i + j);
|
||||||
ADC(gpr.R(d), WA, ARM64Reg::WZR);
|
ADC(gpr.R(d), WA, ARM64Reg::WZR);
|
||||||
gpr.Unlock(WA);
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case CarryFlag::ConstantTrue:
|
case CarryFlag::ConstantTrue:
|
||||||
@ -1274,9 +1267,17 @@ void JitArm64::subfex(UGeckoInstruction inst)
|
|||||||
else
|
else
|
||||||
{
|
{
|
||||||
gpr.BindToRegister(d, d == a || d == b);
|
gpr.BindToRegister(d, d == a || d == b);
|
||||||
ARM64Reg RB = mex ? gpr.GetReg() : gpr.R(b);
|
{
|
||||||
|
Arm64GPRCache::ScopedARM64Reg RB;
|
||||||
if (mex)
|
if (mex)
|
||||||
|
{
|
||||||
|
RB = gpr.GetScopedReg();
|
||||||
MOVI2R(RB, -1);
|
MOVI2R(RB, -1);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
RB = gpr.R(b);
|
||||||
|
}
|
||||||
|
|
||||||
if (js.carryFlag == CarryFlag::ConstantTrue)
|
if (js.carryFlag == CarryFlag::ConstantTrue)
|
||||||
{
|
{
|
||||||
@ -1287,10 +1288,9 @@ void JitArm64::subfex(UGeckoInstruction inst)
|
|||||||
LoadCarry();
|
LoadCarry();
|
||||||
CARRY_IF_NEEDED(SBC, SBCS, gpr.R(d), RB, gpr.R(a));
|
CARRY_IF_NEEDED(SBC, SBCS, gpr.R(d), RB, gpr.R(a));
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
ComputeCarry();
|
ComputeCarry();
|
||||||
if (mex)
|
|
||||||
gpr.Unlock(RB);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (inst.Rc)
|
if (inst.Rc)
|
||||||
@ -1343,12 +1343,13 @@ void JitArm64::subfzex(UGeckoInstruction inst)
|
|||||||
{
|
{
|
||||||
case CarryFlag::InPPCState:
|
case CarryFlag::InPPCState:
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
{
|
||||||
|
auto WA = gpr.GetScopedReg();
|
||||||
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
||||||
MVN(gpr.R(d), gpr.R(a));
|
MVN(gpr.R(d), gpr.R(a));
|
||||||
CARRY_IF_NEEDED(ADD, ADDS, gpr.R(d), gpr.R(d), WA);
|
CARRY_IF_NEEDED(ADD, ADDS, gpr.R(d), gpr.R(d), WA);
|
||||||
|
}
|
||||||
ComputeCarry();
|
ComputeCarry();
|
||||||
gpr.Unlock(WA);
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case CarryFlag::InHostCarry:
|
case CarryFlag::InHostCarry:
|
||||||
@ -1394,21 +1395,20 @@ void JitArm64::subfic(UGeckoInstruction inst)
|
|||||||
{
|
{
|
||||||
const bool will_read = d == a;
|
const bool will_read = d == a;
|
||||||
const bool is_zero = imm == 0;
|
const bool is_zero = imm == 0;
|
||||||
const bool allocate_reg = will_read && !is_zero;
|
|
||||||
gpr.BindToRegister(d, will_read);
|
gpr.BindToRegister(d, will_read);
|
||||||
|
|
||||||
// d = imm - a
|
// d = imm - a
|
||||||
ARM64Reg RD = gpr.R(d);
|
ARM64Reg RD = gpr.R(d);
|
||||||
ARM64Reg WA = ARM64Reg::WZR;
|
{
|
||||||
|
Arm64GPRCache::ScopedARM64Reg WA(ARM64Reg::WZR);
|
||||||
if (!is_zero)
|
if (!is_zero)
|
||||||
{
|
{
|
||||||
WA = will_read ? gpr.GetReg() : RD;
|
WA = will_read ? gpr.GetScopedReg() : Arm64GPRCache::ScopedARM64Reg(RD);
|
||||||
MOVI2R(WA, imm);
|
MOVI2R(WA, imm);
|
||||||
}
|
}
|
||||||
CARRY_IF_NEEDED(SUB, SUBS, RD, WA, gpr.R(a));
|
|
||||||
|
|
||||||
if (allocate_reg)
|
CARRY_IF_NEEDED(SUB, SUBS, RD, WA, gpr.R(a));
|
||||||
gpr.Unlock(WA);
|
}
|
||||||
|
|
||||||
ComputeCarry();
|
ComputeCarry();
|
||||||
}
|
}
|
||||||
@ -1433,10 +1433,9 @@ void JitArm64::addex(UGeckoInstruction inst)
|
|||||||
{
|
{
|
||||||
case CarryFlag::InPPCState:
|
case CarryFlag::InPPCState:
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
||||||
ADDI2R(gpr.R(d), WA, i + j, gpr.R(d));
|
ADDI2R(gpr.R(d), WA, i + j, gpr.R(d));
|
||||||
gpr.Unlock(WA);
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
case CarryFlag::InHostCarry:
|
case CarryFlag::InHostCarry:
|
||||||
@ -1477,9 +1476,17 @@ void JitArm64::addex(UGeckoInstruction inst)
|
|||||||
else
|
else
|
||||||
{
|
{
|
||||||
gpr.BindToRegister(d, d == a || d == b);
|
gpr.BindToRegister(d, d == a || d == b);
|
||||||
ARM64Reg RB = mex ? gpr.GetReg() : gpr.R(b);
|
{
|
||||||
|
Arm64GPRCache::ScopedARM64Reg RB;
|
||||||
if (mex)
|
if (mex)
|
||||||
|
{
|
||||||
|
RB = gpr.GetScopedReg();
|
||||||
MOVI2R(RB, -1);
|
MOVI2R(RB, -1);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
RB = gpr.R(b);
|
||||||
|
}
|
||||||
|
|
||||||
if (js.carryFlag == CarryFlag::ConstantFalse)
|
if (js.carryFlag == CarryFlag::ConstantFalse)
|
||||||
{
|
{
|
||||||
@ -1490,10 +1497,9 @@ void JitArm64::addex(UGeckoInstruction inst)
|
|||||||
LoadCarry();
|
LoadCarry();
|
||||||
CARRY_IF_NEEDED(ADC, ADCS, gpr.R(d), gpr.R(a), RB);
|
CARRY_IF_NEEDED(ADC, ADCS, gpr.R(d), gpr.R(a), RB);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
ComputeCarry();
|
ComputeCarry();
|
||||||
if (mex)
|
|
||||||
gpr.Unlock(RB);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (inst.Rc)
|
if (inst.Rc)
|
||||||
@ -1575,7 +1581,7 @@ void JitArm64::divwux(UGeckoInstruction inst)
|
|||||||
{
|
{
|
||||||
UnsignedMagic m = UnsignedDivisionConstants(divisor);
|
UnsignedMagic m = UnsignedDivisionConstants(divisor);
|
||||||
|
|
||||||
ARM64Reg WI = allocate_reg ? gpr.GetReg() : RD;
|
auto WI = allocate_reg ? gpr.GetScopedReg() : Arm64GPRCache::ScopedARM64Reg(RD);
|
||||||
ARM64Reg XD = EncodeRegTo64(RD);
|
ARM64Reg XD = EncodeRegTo64(RD);
|
||||||
|
|
||||||
MOVI2R(WI, m.multiplier);
|
MOVI2R(WI, m.multiplier);
|
||||||
@ -1590,9 +1596,6 @@ void JitArm64::divwux(UGeckoInstruction inst)
|
|||||||
}
|
}
|
||||||
|
|
||||||
LSR(XD, XD, 32 + m.shift);
|
LSR(XD, XD, 32 + m.shift);
|
||||||
|
|
||||||
if (allocate_reg)
|
|
||||||
gpr.Unlock(WI);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (inst.Rc)
|
if (inst.Rc)
|
||||||
@ -1719,7 +1722,7 @@ void JitArm64::divwx(UGeckoInstruction inst)
|
|||||||
ARM64Reg RA = gpr.R(a);
|
ARM64Reg RA = gpr.R(a);
|
||||||
ARM64Reg RD = gpr.R(d);
|
ARM64Reg RD = gpr.R(d);
|
||||||
|
|
||||||
ARM64Reg WA = allocate_reg ? gpr.GetReg() : RD;
|
auto WA = allocate_reg ? gpr.GetScopedReg() : Arm64GPRCache::ScopedARM64Reg(RD);
|
||||||
|
|
||||||
TST(RA, RA);
|
TST(RA, RA);
|
||||||
ADDI2R(WA, RA, abs_val - 1, WA);
|
ADDI2R(WA, RA, abs_val - 1, WA);
|
||||||
@ -1729,9 +1732,6 @@ void JitArm64::divwx(UGeckoInstruction inst)
|
|||||||
NEG(RD, WA, ArithOption(WA, ShiftType::ASR, MathUtil::IntLog2(abs_val)));
|
NEG(RD, WA, ArithOption(WA, ShiftType::ASR, MathUtil::IntLog2(abs_val)));
|
||||||
else
|
else
|
||||||
ASR(RD, WA, MathUtil::IntLog2(abs_val));
|
ASR(RD, WA, MathUtil::IntLog2(abs_val));
|
||||||
|
|
||||||
if (allocate_reg)
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
@ -1739,8 +1739,8 @@ void JitArm64::divwx(UGeckoInstruction inst)
|
|||||||
SignedMagic m = SignedDivisionConstants(divisor);
|
SignedMagic m = SignedDivisionConstants(divisor);
|
||||||
|
|
||||||
ARM64Reg RD = gpr.R(d);
|
ARM64Reg RD = gpr.R(d);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg WB = allocate_reg ? gpr.GetReg() : RD;
|
auto WB = allocate_reg ? gpr.GetScopedReg() : Arm64GPRCache::ScopedARM64Reg(RD);
|
||||||
|
|
||||||
ARM64Reg XD = EncodeRegTo64(RD);
|
ARM64Reg XD = EncodeRegTo64(RD);
|
||||||
ARM64Reg XA = EncodeRegTo64(WA);
|
ARM64Reg XA = EncodeRegTo64(WA);
|
||||||
@ -1776,10 +1776,6 @@ void JitArm64::divwx(UGeckoInstruction inst)
|
|||||||
ASR(XD, XD, 32 + m.shift);
|
ASR(XD, XD, 32 + m.shift);
|
||||||
ADD(RD, WA, RD);
|
ADD(RD, WA, RD);
|
||||||
}
|
}
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
if (allocate_reg)
|
|
||||||
gpr.Unlock(WB);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (inst.Rc)
|
if (inst.Rc)
|
||||||
@ -1982,8 +1978,7 @@ void JitArm64::srawx(UGeckoInstruction inst)
|
|||||||
else
|
else
|
||||||
{
|
{
|
||||||
gpr.BindToRegister(a, a == s);
|
gpr.BindToRegister(a, a == s);
|
||||||
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg WA = gpr.GetReg();
|
|
||||||
|
|
||||||
if (a != s)
|
if (a != s)
|
||||||
{
|
{
|
||||||
@ -2009,8 +2004,6 @@ void JitArm64::srawx(UGeckoInstruction inst)
|
|||||||
|
|
||||||
CSET(WA, CC_NEQ);
|
CSET(WA, CC_NEQ);
|
||||||
ComputeCarry(WA);
|
ComputeCarry(WA);
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
@ -2018,8 +2011,8 @@ void JitArm64::srawx(UGeckoInstruction inst)
|
|||||||
const bool will_read = a == b || a == s;
|
const bool will_read = a == b || a == s;
|
||||||
gpr.BindToRegister(a, will_read);
|
gpr.BindToRegister(a, will_read);
|
||||||
|
|
||||||
const bool allocate_reg = will_read || js.op->wantsCA;
|
auto WA =
|
||||||
ARM64Reg WA = allocate_reg ? gpr.GetReg() : gpr.R(a);
|
will_read || js.op->wantsCA ? gpr.GetScopedReg() : Arm64GPRCache::ScopedARM64Reg(gpr.R(a));
|
||||||
|
|
||||||
LSL(EncodeRegTo64(WA), EncodeRegTo64(gpr.R(s)), 32);
|
LSL(EncodeRegTo64(WA), EncodeRegTo64(gpr.R(s)), 32);
|
||||||
ASRV(EncodeRegTo64(WA), EncodeRegTo64(WA), EncodeRegTo64(gpr.R(b)));
|
ASRV(EncodeRegTo64(WA), EncodeRegTo64(WA), EncodeRegTo64(gpr.R(b)));
|
||||||
@ -2031,9 +2024,6 @@ void JitArm64::srawx(UGeckoInstruction inst)
|
|||||||
CSET(WA, CC_NEQ);
|
CSET(WA, CC_NEQ);
|
||||||
ComputeCarry(WA);
|
ComputeCarry(WA);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (allocate_reg)
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (inst.Rc)
|
if (inst.Rc)
|
||||||
@ -2088,10 +2078,9 @@ void JitArm64::rlwimix(UGeckoInstruction inst)
|
|||||||
// No rotation
|
// No rotation
|
||||||
// No mask inversion
|
// No mask inversion
|
||||||
gpr.BindToRegister(a, true);
|
gpr.BindToRegister(a, true);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
UBFX(WA, gpr.R(s), lsb, width);
|
UBFX(WA, gpr.R(s), lsb, width);
|
||||||
BFI(gpr.R(a), WA, lsb, width);
|
BFI(gpr.R(a), WA, lsb, width);
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
else if (inst.SH && inst.MB <= inst.ME)
|
else if (inst.SH && inst.MB <= inst.ME)
|
||||||
{
|
{
|
||||||
@ -2103,28 +2092,22 @@ void JitArm64::rlwimix(UGeckoInstruction inst)
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ROR(WA, gpr.R(s), (rot_dist + lsb) % 32);
|
ROR(WA, gpr.R(s), (rot_dist + lsb) % 32);
|
||||||
BFI(gpr.R(a), WA, lsb, width);
|
BFI(gpr.R(a), WA, lsb, width);
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
gpr.BindToRegister(a, true);
|
gpr.BindToRegister(a, true);
|
||||||
const bool allocate_reg = a == s;
|
|
||||||
ARM64Reg RA = gpr.R(a);
|
ARM64Reg RA = gpr.R(a);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg WB = allocate_reg ? gpr.GetReg() : RA;
|
auto WB = a == s ? gpr.GetScopedReg() : Arm64GPRCache::ScopedARM64Reg(RA);
|
||||||
|
|
||||||
MOVI2R(WA, mask);
|
MOVI2R(WA, mask);
|
||||||
BIC(WB, RA, WA);
|
BIC(WB, RA, WA);
|
||||||
AND(WA, WA, gpr.R(s), ArithOption(gpr.R(s), ShiftType::ROR, rot_dist));
|
AND(WA, WA, gpr.R(s), ArithOption(gpr.R(s), ShiftType::ROR, rot_dist));
|
||||||
ORR(RA, WB, WA);
|
ORR(RA, WB, WA);
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
if (allocate_reg)
|
|
||||||
gpr.Unlock(WB);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (inst.Rc)
|
if (inst.Rc)
|
||||||
|
@ -538,9 +538,12 @@ void JitArm64::lmw(UGeckoInstruction inst)
|
|||||||
else
|
else
|
||||||
ADDI2R(addr_reg, gpr.R(a), offset, addr_reg);
|
ADDI2R(addr_reg, gpr.R(a), offset, addr_reg);
|
||||||
|
|
||||||
ARM64Reg addr_base_reg = a_is_addr_base_reg ? ARM64Reg::INVALID_REG : gpr.GetReg();
|
Arm64RegCache::ScopedARM64Reg addr_base_reg;
|
||||||
if (!a_is_addr_base_reg)
|
if (!a_is_addr_base_reg)
|
||||||
|
{
|
||||||
|
addr_base_reg = gpr.GetScopedReg();
|
||||||
MOV(addr_base_reg, addr_reg);
|
MOV(addr_base_reg, addr_reg);
|
||||||
|
}
|
||||||
|
|
||||||
BitSet32 gprs_to_discard{};
|
BitSet32 gprs_to_discard{};
|
||||||
if (!jo.memcheck)
|
if (!jo.memcheck)
|
||||||
@ -628,8 +631,6 @@ void JitArm64::lmw(UGeckoInstruction inst)
|
|||||||
gpr.Unlock(ARM64Reg::W1, ARM64Reg::W30);
|
gpr.Unlock(ARM64Reg::W1, ARM64Reg::W30);
|
||||||
if (jo.memcheck || !jo.fastmem)
|
if (jo.memcheck || !jo.fastmem)
|
||||||
gpr.Unlock(ARM64Reg::W0);
|
gpr.Unlock(ARM64Reg::W0);
|
||||||
if (!a_is_addr_base_reg)
|
|
||||||
gpr.Unlock(addr_base_reg);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::stmw(UGeckoInstruction inst)
|
void JitArm64::stmw(UGeckoInstruction inst)
|
||||||
@ -655,9 +656,12 @@ void JitArm64::stmw(UGeckoInstruction inst)
|
|||||||
else
|
else
|
||||||
ADDI2R(addr_reg, gpr.R(a), offset, addr_reg);
|
ADDI2R(addr_reg, gpr.R(a), offset, addr_reg);
|
||||||
|
|
||||||
ARM64Reg addr_base_reg = a_is_addr_base_reg ? ARM64Reg::INVALID_REG : gpr.GetReg();
|
Arm64GPRCache::ScopedARM64Reg addr_base_reg;
|
||||||
if (!a_is_addr_base_reg)
|
if (!a_is_addr_base_reg)
|
||||||
|
{
|
||||||
|
addr_base_reg = gpr.GetScopedReg();
|
||||||
MOV(addr_base_reg, addr_reg);
|
MOV(addr_base_reg, addr_reg);
|
||||||
|
}
|
||||||
|
|
||||||
BitSet32 gprs_to_discard{};
|
BitSet32 gprs_to_discard{};
|
||||||
if (!jo.memcheck)
|
if (!jo.memcheck)
|
||||||
@ -748,8 +752,6 @@ void JitArm64::stmw(UGeckoInstruction inst)
|
|||||||
gpr.Unlock(ARM64Reg::W1, ARM64Reg::W2, ARM64Reg::W30);
|
gpr.Unlock(ARM64Reg::W1, ARM64Reg::W2, ARM64Reg::W30);
|
||||||
if (!jo.fastmem)
|
if (!jo.fastmem)
|
||||||
gpr.Unlock(ARM64Reg::W0);
|
gpr.Unlock(ARM64Reg::W0);
|
||||||
if (!a_is_addr_base_reg)
|
|
||||||
gpr.Unlock(addr_base_reg);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::dcbx(UGeckoInstruction inst)
|
void JitArm64::dcbx(UGeckoInstruction inst)
|
||||||
@ -786,8 +788,8 @@ void JitArm64::dcbx(UGeckoInstruction inst)
|
|||||||
// bdnz afterwards! So if we invalidate a single cache line, we don't adjust the registers at
|
// bdnz afterwards! So if we invalidate a single cache line, we don't adjust the registers at
|
||||||
// all, if we invalidate 2 cachelines we adjust the registers by one step, and so on.
|
// all, if we invalidate 2 cachelines we adjust the registers by one step, and so on.
|
||||||
|
|
||||||
const ARM64Reg reg_cycle_count = gpr.GetReg();
|
const auto reg_cycle_count = gpr.GetScopedReg();
|
||||||
const ARM64Reg reg_downcount = gpr.GetReg();
|
const auto reg_downcount = gpr.GetScopedReg();
|
||||||
|
|
||||||
// Figure out how many loops we want to do.
|
// Figure out how many loops we want to do.
|
||||||
const u8 cycle_count_per_loop =
|
const u8 cycle_count_per_loop =
|
||||||
@ -855,12 +857,9 @@ void JitArm64::dcbx(UGeckoInstruction inst)
|
|||||||
SetJumpTarget(branch_out);
|
SetJumpTarget(branch_out);
|
||||||
SetJumpTarget(branch_over);
|
SetJumpTarget(branch_over);
|
||||||
}
|
}
|
||||||
|
|
||||||
gpr.Unlock(reg_cycle_count, reg_downcount);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
constexpr ARM64Reg effective_addr = WB;
|
constexpr ARM64Reg effective_addr = WB;
|
||||||
const ARM64Reg physical_addr = gpr.GetReg();
|
|
||||||
|
|
||||||
if (a)
|
if (a)
|
||||||
ADD(effective_addr, gpr.R(a), gpr.R(b));
|
ADD(effective_addr, gpr.R(a), gpr.R(b));
|
||||||
@ -874,6 +873,8 @@ void JitArm64::dcbx(UGeckoInstruction inst)
|
|||||||
ADD(gpr.R(b), gpr.R(b), WA, ArithOption(WA, ShiftType::LSL, 5)); // Rb += (WA * 32)
|
ADD(gpr.R(b), gpr.R(b), WA, ArithOption(WA, ShiftType::LSL, 5)); // Rb += (WA * 32)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
auto physical_addr = gpr.GetScopedReg();
|
||||||
|
|
||||||
// Translate effective address to physical address.
|
// Translate effective address to physical address.
|
||||||
const u8* loop_start = GetCodePtr();
|
const u8* loop_start = GetCodePtr();
|
||||||
FixupBranch bat_lookup_failed;
|
FixupBranch bat_lookup_failed;
|
||||||
@ -939,7 +940,7 @@ void JitArm64::dcbx(UGeckoInstruction inst)
|
|||||||
SwitchToNearCode();
|
SwitchToNearCode();
|
||||||
SetJumpTarget(near_addr);
|
SetJumpTarget(near_addr);
|
||||||
|
|
||||||
gpr.Unlock(WA, WB, physical_addr);
|
gpr.Unlock(WA, WB);
|
||||||
if (make_loop)
|
if (make_loop)
|
||||||
gpr.Unlock(loop_counter);
|
gpr.Unlock(loop_counter);
|
||||||
}
|
}
|
||||||
|
@ -268,14 +268,14 @@ void JitArm64::stfXX(UGeckoInstruction inst)
|
|||||||
|
|
||||||
const bool have_single = fpr.IsSingle(inst.FS, true);
|
const bool have_single = fpr.IsSingle(inst.FS, true);
|
||||||
|
|
||||||
ARM64Reg V0 =
|
Arm64FPRCache::ScopedARM64Reg V0 =
|
||||||
fpr.R(inst.FS, want_single && have_single ? RegType::LowerPairSingle : RegType::LowerPair);
|
fpr.R(inst.FS, want_single && have_single ? RegType::LowerPairSingle : RegType::LowerPair);
|
||||||
|
|
||||||
if (want_single && !have_single)
|
if (want_single && !have_single)
|
||||||
{
|
{
|
||||||
const ARM64Reg single_reg = fpr.GetReg();
|
auto single_reg = fpr.GetScopedReg();
|
||||||
ConvertDoubleToSingleLower(inst.FS, single_reg, V0);
|
ConvertDoubleToSingleLower(inst.FS, single_reg, V0);
|
||||||
V0 = single_reg;
|
V0 = std::move(single_reg);
|
||||||
}
|
}
|
||||||
|
|
||||||
gpr.Lock(ARM64Reg::W1, ARM64Reg::W2, ARM64Reg::W30);
|
gpr.Lock(ARM64Reg::W1, ARM64Reg::W2, ARM64Reg::W30);
|
||||||
@ -425,9 +425,6 @@ void JitArm64::stfXX(UGeckoInstruction inst)
|
|||||||
MOV(gpr.R(a), addr_reg);
|
MOV(gpr.R(a), addr_reg);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (want_single && !have_single)
|
|
||||||
fpr.Unlock(V0);
|
|
||||||
|
|
||||||
gpr.Unlock(ARM64Reg::W1, ARM64Reg::W2, ARM64Reg::W30);
|
gpr.Unlock(ARM64Reg::W1, ARM64Reg::W2, ARM64Reg::W30);
|
||||||
fpr.Unlock(ARM64Reg::Q0);
|
fpr.Unlock(ARM64Reg::Q0);
|
||||||
if (!jo.fastmem)
|
if (!jo.fastmem)
|
||||||
|
@ -173,20 +173,21 @@ void JitArm64::psq_stXX(UGeckoInstruction inst)
|
|||||||
|
|
||||||
const bool have_single = fpr.IsSingle(inst.RS);
|
const bool have_single = fpr.IsSingle(inst.RS);
|
||||||
|
|
||||||
ARM64Reg VS = fpr.R(inst.RS, have_single ? RegType::Single : RegType::Register);
|
Arm64FPRCache::ScopedARM64Reg VS =
|
||||||
|
fpr.R(inst.RS, have_single ? RegType::Single : RegType::Register);
|
||||||
|
|
||||||
if (js.assumeNoPairedQuantize)
|
if (js.assumeNoPairedQuantize)
|
||||||
{
|
{
|
||||||
if (!have_single)
|
if (!have_single)
|
||||||
{
|
{
|
||||||
const ARM64Reg single_reg = fpr.GetReg();
|
auto single_reg = fpr.GetScopedReg();
|
||||||
|
|
||||||
if (w)
|
if (w)
|
||||||
m_float_emit.FCVT(32, 64, EncodeRegToDouble(single_reg), EncodeRegToDouble(VS));
|
m_float_emit.FCVT(32, 64, EncodeRegToDouble(single_reg), EncodeRegToDouble(VS));
|
||||||
else
|
else
|
||||||
m_float_emit.FCVTN(32, EncodeRegToDouble(single_reg), EncodeRegToDouble(VS));
|
m_float_emit.FCVTN(32, EncodeRegToDouble(single_reg), EncodeRegToDouble(VS));
|
||||||
|
|
||||||
VS = single_reg;
|
VS = std::move(single_reg);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
@ -279,9 +280,6 @@ void JitArm64::psq_stXX(UGeckoInstruction inst)
|
|||||||
MOV(gpr.R(inst.RA), addr_reg);
|
MOV(gpr.R(inst.RA), addr_reg);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (js.assumeNoPairedQuantize && !have_single)
|
|
||||||
fpr.Unlock(VS);
|
|
||||||
|
|
||||||
gpr.Unlock(ARM64Reg::W1, ARM64Reg::W2, ARM64Reg::W30);
|
gpr.Unlock(ARM64Reg::W1, ARM64Reg::W2, ARM64Reg::W30);
|
||||||
fpr.Unlock(ARM64Reg::Q0);
|
fpr.Unlock(ARM64Reg::Q0);
|
||||||
if (!js.assumeNoPairedQuantize || !jo.fastmem)
|
if (!js.assumeNoPairedQuantize || !jo.fastmem)
|
||||||
|
@ -108,16 +108,17 @@ void JitArm64::ps_arith(UGeckoInstruction inst)
|
|||||||
const ARM64Reg VC = use_c ? reg_encoder(fpr.R(c, type)) : ARM64Reg::INVALID_REG;
|
const ARM64Reg VC = use_c ? reg_encoder(fpr.R(c, type)) : ARM64Reg::INVALID_REG;
|
||||||
const ARM64Reg VD = reg_encoder(fpr.RW(d, type));
|
const ARM64Reg VD = reg_encoder(fpr.RW(d, type));
|
||||||
|
|
||||||
ARM64Reg V0Q = ARM64Reg::INVALID_REG;
|
{
|
||||||
ARM64Reg V1Q = ARM64Reg::INVALID_REG;
|
Arm64FPRCache::ScopedARM64Reg V0Q = ARM64Reg::INVALID_REG;
|
||||||
ARM64Reg V2Q = ARM64Reg::INVALID_REG;
|
Arm64FPRCache::ScopedARM64Reg V1Q = ARM64Reg::INVALID_REG;
|
||||||
|
Arm64FPRCache::ScopedARM64Reg V2Q = ARM64Reg::INVALID_REG;
|
||||||
|
|
||||||
ARM64Reg rounded_c_reg = VC;
|
ARM64Reg rounded_c_reg = VC;
|
||||||
if (round_c)
|
if (round_c)
|
||||||
{
|
{
|
||||||
ASSERT_MSG(DYNA_REC, !singles, "Tried to apply 25-bit precision to single");
|
ASSERT_MSG(DYNA_REC, !singles, "Tried to apply 25-bit precision to single");
|
||||||
|
|
||||||
V0Q = fpr.GetReg();
|
V0Q = fpr.GetScopedReg();
|
||||||
rounded_c_reg = reg_encoder(V0Q);
|
rounded_c_reg = reg_encoder(V0Q);
|
||||||
Force25BitPrecision(rounded_c_reg, VC);
|
Force25BitPrecision(rounded_c_reg, VC);
|
||||||
}
|
}
|
||||||
@ -126,7 +127,7 @@ void JitArm64::ps_arith(UGeckoInstruction inst)
|
|||||||
if (fma && inaccurate_fma && VD == VB)
|
if (fma && inaccurate_fma && VD == VB)
|
||||||
{
|
{
|
||||||
if (V0Q == ARM64Reg::INVALID_REG)
|
if (V0Q == ARM64Reg::INVALID_REG)
|
||||||
V0Q = fpr.GetReg();
|
V0Q = fpr.GetScopedReg();
|
||||||
inaccurate_fma_reg = reg_encoder(V0Q);
|
inaccurate_fma_reg = reg_encoder(V0Q);
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -137,17 +138,17 @@ void JitArm64::ps_arith(UGeckoInstruction inst)
|
|||||||
m_accurate_nans && (VD == VA || (use_b && VD == VB) || (use_c && VD == VC));
|
m_accurate_nans && (VD == VA || (use_b && VD == VB) || (use_c && VD == VC));
|
||||||
if (need_accurate_fma_reg || preserve_d)
|
if (need_accurate_fma_reg || preserve_d)
|
||||||
{
|
{
|
||||||
V1Q = fpr.GetReg();
|
V1Q = fpr.GetScopedReg();
|
||||||
result_reg = reg_encoder(V1Q);
|
result_reg = reg_encoder(V1Q);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (m_accurate_nans)
|
if (m_accurate_nans)
|
||||||
{
|
{
|
||||||
if (V0Q == ARM64Reg::INVALID_REG)
|
if (V0Q == ARM64Reg::INVALID_REG)
|
||||||
V0Q = fpr.GetReg();
|
V0Q = fpr.GetScopedReg();
|
||||||
|
|
||||||
if (duplicated_c || VD == result_reg)
|
if (duplicated_c || VD == result_reg)
|
||||||
V2Q = fpr.GetReg();
|
V2Q = fpr.GetScopedReg();
|
||||||
}
|
}
|
||||||
|
|
||||||
switch (op5)
|
switch (op5)
|
||||||
@ -295,13 +296,7 @@ void JitArm64::ps_arith(UGeckoInstruction inst)
|
|||||||
|
|
||||||
if (m_accurate_nans)
|
if (m_accurate_nans)
|
||||||
SetJumpTarget(nan_fixup);
|
SetJumpTarget(nan_fixup);
|
||||||
|
}
|
||||||
if (V0Q != ARM64Reg::INVALID_REG)
|
|
||||||
fpr.Unlock(V0Q);
|
|
||||||
if (V1Q != ARM64Reg::INVALID_REG)
|
|
||||||
fpr.Unlock(V1Q);
|
|
||||||
if (V2Q != ARM64Reg::INVALID_REG)
|
|
||||||
fpr.Unlock(V2Q);
|
|
||||||
|
|
||||||
ASSERT_MSG(DYNA_REC, singles == singles_func(),
|
ASSERT_MSG(DYNA_REC, singles == singles_func(),
|
||||||
"Register allocation turned singles into doubles in the middle of ps_arith");
|
"Register allocation turned singles into doubles in the middle of ps_arith");
|
||||||
@ -339,12 +334,11 @@ void JitArm64::ps_sel(UGeckoInstruction inst)
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
const ARM64Reg V0Q = fpr.GetReg();
|
const auto V0Q = fpr.GetScopedReg();
|
||||||
const ARM64Reg V0 = reg_encoder(V0Q);
|
const ARM64Reg V0 = reg_encoder(V0Q);
|
||||||
m_float_emit.FCMGE(size, V0, VA);
|
m_float_emit.FCMGE(size, V0, VA);
|
||||||
m_float_emit.BSL(V0, VC, VB);
|
m_float_emit.BSL(V0, VC, VB);
|
||||||
m_float_emit.MOV(VD, V0);
|
m_float_emit.MOV(VD, V0);
|
||||||
fpr.Unlock(V0Q);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
ASSERT_MSG(DYNA_REC, singles == (fpr.IsSingle(a) && fpr.IsSingle(b) && fpr.IsSingle(c)),
|
ASSERT_MSG(DYNA_REC, singles == (fpr.IsSingle(a) && fpr.IsSingle(b) && fpr.IsSingle(c)),
|
||||||
@ -375,16 +369,21 @@ void JitArm64::ps_sumX(UGeckoInstruction inst)
|
|||||||
const ARM64Reg VB = fpr.R(b, type);
|
const ARM64Reg VB = fpr.R(b, type);
|
||||||
const ARM64Reg VC = fpr.R(c, type);
|
const ARM64Reg VC = fpr.R(c, type);
|
||||||
const ARM64Reg VD = fpr.RW(d, type);
|
const ARM64Reg VD = fpr.RW(d, type);
|
||||||
const ARM64Reg V0 = fpr.GetReg();
|
|
||||||
|
{
|
||||||
|
const auto V0 = fpr.GetScopedReg();
|
||||||
|
|
||||||
m_float_emit.DUP(size, reg_encoder(V0), reg_encoder(VB), 1);
|
m_float_emit.DUP(size, reg_encoder(V0), reg_encoder(VB), 1);
|
||||||
|
|
||||||
if (m_accurate_nans)
|
if (m_accurate_nans)
|
||||||
{
|
{
|
||||||
// If the first input is NaN, set the temp register for the second input to 0. This is because:
|
// If the first input is NaN, set the temp register for the second input to 0. This is
|
||||||
|
// because:
|
||||||
//
|
//
|
||||||
// - If the second input is also NaN, setting it to 0 ensures that the first NaN will be picked.
|
// - If the second input is also NaN, setting it to 0 ensures that the first NaN will be
|
||||||
// - If only the first input is NaN, setting the second input to 0 has no effect on the result.
|
// picked.
|
||||||
|
// - If only the first input is NaN, setting the second input to 0 has no effect on the
|
||||||
|
// result.
|
||||||
//
|
//
|
||||||
// Either way, we can then do an FADD as usual, and the FADD will make the NaN quiet.
|
// Either way, we can then do an FADD as usual, and the FADD will make the NaN quiet.
|
||||||
m_float_emit.FCMP(scalar_reg_encoder(VA));
|
m_float_emit.FCMP(scalar_reg_encoder(VA));
|
||||||
@ -408,8 +407,7 @@ void JitArm64::ps_sumX(UGeckoInstruction inst)
|
|||||||
m_float_emit.FADD(scalar_reg_encoder(V0), scalar_reg_encoder(V0), scalar_reg_encoder(VA));
|
m_float_emit.FADD(scalar_reg_encoder(V0), scalar_reg_encoder(V0), scalar_reg_encoder(VA));
|
||||||
m_float_emit.INS(size, VD, 0, V0, 0);
|
m_float_emit.INS(size, VD, 0, V0, 0);
|
||||||
}
|
}
|
||||||
|
}
|
||||||
fpr.Unlock(V0);
|
|
||||||
|
|
||||||
ASSERT_MSG(DYNA_REC, singles == (fpr.IsSingle(a) && fpr.IsSingle(b) && fpr.IsSingle(c)),
|
ASSERT_MSG(DYNA_REC, singles == (fpr.IsSingle(a) && fpr.IsSingle(b) && fpr.IsSingle(c)),
|
||||||
"Register allocation turned singles into doubles in the middle of ps_sumX");
|
"Register allocation turned singles into doubles in the middle of ps_sumX");
|
||||||
|
@ -177,6 +177,59 @@ public:
|
|||||||
// Requires unlocking after done
|
// Requires unlocking after done
|
||||||
Arm64Gen::ARM64Reg GetReg();
|
Arm64Gen::ARM64Reg GetReg();
|
||||||
|
|
||||||
|
class ScopedARM64Reg
|
||||||
|
{
|
||||||
|
public:
|
||||||
|
inline ScopedARM64Reg() = default;
|
||||||
|
ScopedARM64Reg(const ScopedARM64Reg&) = delete;
|
||||||
|
explicit inline ScopedARM64Reg(Arm64RegCache& cache) : m_reg(cache.GetReg()), m_gpr(&cache) {}
|
||||||
|
inline ScopedARM64Reg(Arm64Gen::ARM64Reg reg) : m_reg(reg) {}
|
||||||
|
inline ScopedARM64Reg(ScopedARM64Reg&& scoped_reg) { *this = std::move(scoped_reg); }
|
||||||
|
inline ~ScopedARM64Reg() { Unlock(); }
|
||||||
|
|
||||||
|
inline ScopedARM64Reg& operator=(const ScopedARM64Reg&) = delete;
|
||||||
|
inline ScopedARM64Reg& operator=(Arm64Gen::ARM64Reg reg)
|
||||||
|
{
|
||||||
|
Unlock();
|
||||||
|
m_reg = reg;
|
||||||
|
return *this;
|
||||||
|
}
|
||||||
|
inline ScopedARM64Reg& operator=(ScopedARM64Reg&& scoped_reg)
|
||||||
|
{
|
||||||
|
// Taking ownership of an existing scoped register, no need to release.
|
||||||
|
m_reg = scoped_reg.m_reg;
|
||||||
|
m_gpr = scoped_reg.m_gpr;
|
||||||
|
scoped_reg.Invalidate();
|
||||||
|
return *this;
|
||||||
|
}
|
||||||
|
|
||||||
|
inline Arm64Gen::ARM64Reg GetReg() const { return m_reg; }
|
||||||
|
inline operator Arm64Gen::ARM64Reg() const { return GetReg(); }
|
||||||
|
inline void Unlock()
|
||||||
|
{
|
||||||
|
// Only unlock the register if GPR is set.
|
||||||
|
if (m_gpr != nullptr)
|
||||||
|
{
|
||||||
|
m_gpr->Unlock(m_reg);
|
||||||
|
}
|
||||||
|
Invalidate();
|
||||||
|
}
|
||||||
|
|
||||||
|
private:
|
||||||
|
inline void Invalidate()
|
||||||
|
{
|
||||||
|
m_reg = Arm64Gen::ARM64Reg::INVALID_REG;
|
||||||
|
m_gpr = nullptr;
|
||||||
|
}
|
||||||
|
|
||||||
|
Arm64Gen::ARM64Reg m_reg = Arm64Gen::ARM64Reg::INVALID_REG;
|
||||||
|
Arm64RegCache* m_gpr = nullptr;
|
||||||
|
};
|
||||||
|
|
||||||
|
// Returns a temporary register
|
||||||
|
// Unlocking is implicitly handled through RAII
|
||||||
|
inline ScopedARM64Reg GetScopedReg() { return ScopedARM64Reg(*this); }
|
||||||
|
|
||||||
void UpdateLastUsed(BitSet32 regs_used);
|
void UpdateLastUsed(BitSet32 regs_used);
|
||||||
|
|
||||||
// Get available host registers
|
// Get available host registers
|
||||||
|
@ -48,17 +48,16 @@ void JitArm64::FixGTBeforeSettingCRFieldBit(Arm64Gen::ARM64Reg reg)
|
|||||||
// if the internal representation either has bit 63 set or has all bits set to zero.
|
// if the internal representation either has bit 63 set or has all bits set to zero.
|
||||||
// If all bits are zero and we set some bit that's unrelated to GT, we need to set bit 63 so GT
|
// If all bits are zero and we set some bit that's unrelated to GT, we need to set bit 63 so GT
|
||||||
// doesn't accidentally become considered set. Gross but necessary; this can break actual games.
|
// doesn't accidentally become considered set. Gross but necessary; this can break actual games.
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg XA = EncodeRegTo64(WA);
|
ARM64Reg XA = EncodeRegTo64(WA);
|
||||||
ORR(XA, reg, LogicalImm(1ULL << 63, GPRSize::B64));
|
ORR(XA, reg, LogicalImm(1ULL << 63, GPRSize::B64));
|
||||||
CMP(reg, ARM64Reg::ZR);
|
CMP(reg, ARM64Reg::ZR);
|
||||||
CSEL(reg, reg, XA, CC_NEQ);
|
CSEL(reg, reg, XA, CC_NEQ);
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::UpdateFPExceptionSummary(ARM64Reg fpscr)
|
void JitArm64::UpdateFPExceptionSummary(ARM64Reg fpscr)
|
||||||
{
|
{
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
|
|
||||||
// fpscr.VX = (fpscr & FPSCR_VX_ANY) != 0
|
// fpscr.VX = (fpscr & FPSCR_VX_ANY) != 0
|
||||||
MOVI2R(WA, FPSCR_VX_ANY);
|
MOVI2R(WA, FPSCR_VX_ANY);
|
||||||
@ -71,8 +70,6 @@ void JitArm64::UpdateFPExceptionSummary(ARM64Reg fpscr)
|
|||||||
TST(WA, fpscr, ArithOption(fpscr, ShiftType::LSR, 22));
|
TST(WA, fpscr, ArithOption(fpscr, ShiftType::LSR, 22));
|
||||||
CSET(WA, CCFlags::CC_NEQ);
|
CSET(WA, CCFlags::CC_NEQ);
|
||||||
BFI(fpscr, WA, MathUtil::IntLog2(FPSCR_FEX), 1);
|
BFI(fpscr, WA, MathUtil::IntLog2(FPSCR_FEX), 1);
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::UpdateRoundingMode()
|
void JitArm64::UpdateRoundingMode()
|
||||||
@ -135,7 +132,7 @@ void JitArm64::mcrxr(UGeckoInstruction inst)
|
|||||||
JITDISABLE(bJITSystemRegistersOff);
|
JITDISABLE(bJITSystemRegistersOff);
|
||||||
|
|
||||||
gpr.BindCRToRegister(inst.CRFD, false);
|
gpr.BindCRToRegister(inst.CRFD, false);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg XA = EncodeRegTo64(WA);
|
ARM64Reg XA = EncodeRegTo64(WA);
|
||||||
ARM64Reg XB = gpr.CR(inst.CRFD);
|
ARM64Reg XB = gpr.CR(inst.CRFD);
|
||||||
ARM64Reg WB = EncodeRegTo32(XB);
|
ARM64Reg WB = EncodeRegTo32(XB);
|
||||||
@ -155,8 +152,6 @@ void JitArm64::mcrxr(UGeckoInstruction inst)
|
|||||||
// Clear XER[0-3]
|
// Clear XER[0-3]
|
||||||
static_assert(PPCSTATE_OFF(xer_ca) + 1 == PPCSTATE_OFF(xer_so_ov));
|
static_assert(PPCSTATE_OFF(xer_ca) + 1 == PPCSTATE_OFF(xer_so_ov));
|
||||||
STRH(IndexType::Unsigned, ARM64Reg::WZR, PPC_REG, PPCSTATE_OFF(xer_ca));
|
STRH(IndexType::Unsigned, ARM64Reg::WZR, PPC_REG, PPCSTATE_OFF(xer_ca));
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::mfsr(UGeckoInstruction inst)
|
void JitArm64::mfsr(UGeckoInstruction inst)
|
||||||
@ -186,14 +181,12 @@ void JitArm64::mfsrin(UGeckoInstruction inst)
|
|||||||
|
|
||||||
ARM64Reg RB = gpr.R(b);
|
ARM64Reg RB = gpr.R(b);
|
||||||
ARM64Reg RD = gpr.R(d);
|
ARM64Reg RD = gpr.R(d);
|
||||||
ARM64Reg index = gpr.GetReg();
|
auto index = gpr.GetScopedReg();
|
||||||
ARM64Reg addr = EncodeRegTo64(RD);
|
ARM64Reg addr = EncodeRegTo64(RD);
|
||||||
|
|
||||||
UBFM(index, RB, 28, 31);
|
UBFM(index, RB, 28, 31);
|
||||||
ADDI2R(addr, PPC_REG, PPCSTATE_OFF_SR(0), addr);
|
ADDI2R(addr, PPC_REG, PPCSTATE_OFF_SR(0), addr);
|
||||||
LDR(RD, addr, ArithOption(EncodeRegTo64(index), true));
|
LDR(RD, addr, ArithOption(EncodeRegTo64(index), true));
|
||||||
|
|
||||||
gpr.Unlock(index);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::mtsrin(UGeckoInstruction inst)
|
void JitArm64::mtsrin(UGeckoInstruction inst)
|
||||||
@ -206,14 +199,12 @@ void JitArm64::mtsrin(UGeckoInstruction inst)
|
|||||||
|
|
||||||
ARM64Reg RB = gpr.R(b);
|
ARM64Reg RB = gpr.R(b);
|
||||||
ARM64Reg RD = gpr.R(d);
|
ARM64Reg RD = gpr.R(d);
|
||||||
ARM64Reg index = gpr.GetReg();
|
auto index = gpr.GetScopedReg();
|
||||||
ARM64Reg addr = gpr.GetReg();
|
auto addr = gpr.GetScopedReg();
|
||||||
|
|
||||||
UBFM(index, RB, 28, 31);
|
UBFM(index, RB, 28, 31);
|
||||||
ADDI2R(EncodeRegTo64(addr), PPC_REG, PPCSTATE_OFF_SR(0), EncodeRegTo64(addr));
|
ADDI2R(EncodeRegTo64(addr), PPC_REG, PPCSTATE_OFF_SR(0), EncodeRegTo64(addr));
|
||||||
STR(RD, EncodeRegTo64(addr), ArithOption(EncodeRegTo64(index), true));
|
STR(RD, EncodeRegTo64(addr), ArithOption(EncodeRegTo64(index), true));
|
||||||
|
|
||||||
gpr.Unlock(index, addr);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::twx(UGeckoInstruction inst)
|
void JitArm64::twx(UGeckoInstruction inst)
|
||||||
@ -223,7 +214,7 @@ void JitArm64::twx(UGeckoInstruction inst)
|
|||||||
|
|
||||||
s32 a = inst.RA;
|
s32 a = inst.RA;
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
|
|
||||||
if (inst.OPCD == 3) // twi
|
if (inst.OPCD == 3) // twi
|
||||||
{
|
{
|
||||||
@ -278,8 +269,6 @@ void JitArm64::twx(UGeckoInstruction inst)
|
|||||||
fpr.Flush(FlushMode::All, ARM64Reg::INVALID_REG);
|
fpr.Flush(FlushMode::All, ARM64Reg::INVALID_REG);
|
||||||
WriteExit(js.compilerPC + 4);
|
WriteExit(js.compilerPC + 4);
|
||||||
}
|
}
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::mfspr(UGeckoInstruction inst)
|
void JitArm64::mfspr(UGeckoInstruction inst)
|
||||||
@ -294,19 +283,19 @@ void JitArm64::mfspr(UGeckoInstruction inst)
|
|||||||
case SPR_TL:
|
case SPR_TL:
|
||||||
case SPR_TU:
|
case SPR_TU:
|
||||||
{
|
{
|
||||||
ARM64Reg Wg = gpr.GetReg();
|
auto Wg = gpr.GetScopedReg();
|
||||||
ARM64Reg Xg = EncodeRegTo64(Wg);
|
ARM64Reg Xg = EncodeRegTo64(Wg);
|
||||||
|
|
||||||
ARM64Reg Wresult = gpr.GetReg();
|
auto Wresult = gpr.GetScopedReg();
|
||||||
ARM64Reg Xresult = EncodeRegTo64(Wresult);
|
ARM64Reg Xresult = EncodeRegTo64(Wresult);
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg WB = gpr.GetReg();
|
auto WB = gpr.GetScopedReg();
|
||||||
ARM64Reg XA = EncodeRegTo64(WA);
|
ARM64Reg XA = EncodeRegTo64(WA);
|
||||||
ARM64Reg XB = EncodeRegTo64(WB);
|
ARM64Reg XB = EncodeRegTo64(WB);
|
||||||
|
|
||||||
ARM64Reg VC = fpr.GetReg();
|
auto VC = fpr.GetScopedReg();
|
||||||
ARM64Reg VD = fpr.GetReg();
|
auto VD = fpr.GetScopedReg();
|
||||||
ARM64Reg SC = EncodeRegToSingle(VC);
|
ARM64Reg SC = EncodeRegToSingle(VC);
|
||||||
ARM64Reg SD = EncodeRegToSingle(VD);
|
ARM64Reg SD = EncodeRegToSingle(VD);
|
||||||
|
|
||||||
@ -371,8 +360,6 @@ void JitArm64::mfspr(UGeckoInstruction inst)
|
|||||||
else
|
else
|
||||||
LSR(EncodeRegTo64(gpr.R(n)), Xresult, 32);
|
LSR(EncodeRegTo64(gpr.R(n)), Xresult, 32);
|
||||||
|
|
||||||
gpr.Unlock(Wg, Wresult, WA, WB);
|
|
||||||
fpr.Unlock(VC, VD);
|
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -381,22 +368,18 @@ void JitArm64::mfspr(UGeckoInstruction inst)
|
|||||||
LSR(EncodeRegTo64(gpr.R(d)), Xresult, 32);
|
LSR(EncodeRegTo64(gpr.R(d)), Xresult, 32);
|
||||||
else
|
else
|
||||||
MOV(gpr.R(d), Wresult);
|
MOV(gpr.R(d), Wresult);
|
||||||
|
|
||||||
gpr.Unlock(Wg, Wresult, WA, WB);
|
|
||||||
fpr.Unlock(VC, VD);
|
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
case SPR_XER:
|
case SPR_XER:
|
||||||
{
|
{
|
||||||
gpr.BindToRegister(d, false);
|
gpr.BindToRegister(d, false);
|
||||||
ARM64Reg RD = gpr.R(d);
|
ARM64Reg RD = gpr.R(d);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
LDRH(IndexType::Unsigned, RD, PPC_REG, PPCSTATE_OFF(xer_stringctrl));
|
LDRH(IndexType::Unsigned, RD, PPC_REG, PPCSTATE_OFF(xer_stringctrl));
|
||||||
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
||||||
ORR(RD, RD, WA, ArithOption(WA, ShiftType::LSL, XER_CA_SHIFT));
|
ORR(RD, RD, WA, ArithOption(WA, ShiftType::LSL, XER_CA_SHIFT));
|
||||||
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_so_ov));
|
LDRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_so_ov));
|
||||||
ORR(RD, RD, WA, ArithOption(WA, ShiftType::LSL, XER_OV_SHIFT));
|
ORR(RD, RD, WA, ArithOption(WA, ShiftType::LSL, XER_OV_SHIFT));
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
case SPR_WPAR:
|
case SPR_WPAR:
|
||||||
@ -462,14 +445,13 @@ void JitArm64::mtspr(UGeckoInstruction inst)
|
|||||||
case SPR_XER:
|
case SPR_XER:
|
||||||
{
|
{
|
||||||
ARM64Reg RD = gpr.R(inst.RD);
|
ARM64Reg RD = gpr.R(inst.RD);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
AND(WA, RD, LogicalImm(0xFFFFFF7F, GPRSize::B32));
|
AND(WA, RD, LogicalImm(0xFFFFFF7F, GPRSize::B32));
|
||||||
STRH(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_stringctrl));
|
STRH(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_stringctrl));
|
||||||
UBFM(WA, RD, XER_CA_SHIFT, XER_CA_SHIFT + 1);
|
UBFM(WA, RD, XER_CA_SHIFT, XER_CA_SHIFT + 1);
|
||||||
STRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
STRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_ca));
|
||||||
UBFM(WA, RD, XER_OV_SHIFT, 31); // Same as WA = RD >> XER_OV_SHIFT
|
UBFM(WA, RD, XER_OV_SHIFT, 31); // Same as WA = RD >> XER_OV_SHIFT
|
||||||
STRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_so_ov));
|
STRB(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(xer_so_ov));
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
break;
|
break;
|
||||||
default:
|
default:
|
||||||
@ -553,9 +535,10 @@ void JitArm64::crXXX(UGeckoInstruction inst)
|
|||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg XA = EncodeRegTo64(WA);
|
ARM64Reg XA = EncodeRegTo64(WA);
|
||||||
ARM64Reg WB = gpr.GetReg();
|
{
|
||||||
|
auto WB = gpr.GetScopedReg();
|
||||||
ARM64Reg XB = EncodeRegTo64(WB);
|
ARM64Reg XB = EncodeRegTo64(WB);
|
||||||
|
|
||||||
// creqv or crnand or crnor
|
// creqv or crnand or crnor
|
||||||
@ -623,44 +606,41 @@ void JitArm64::crXXX(UGeckoInstruction inst)
|
|||||||
ORR(XA, XA, XB);
|
ORR(XA, XA, XB);
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
}
|
||||||
|
|
||||||
// Store result bit in CRBD
|
// Store result bit in CRBD
|
||||||
int field = inst.CRBD >> 2;
|
int field = inst.CRBD >> 2;
|
||||||
int bit = 3 - (inst.CRBD & 3);
|
int bit = 3 - (inst.CRBD & 3);
|
||||||
|
|
||||||
gpr.Unlock(WB);
|
|
||||||
WB = ARM64Reg::INVALID_REG;
|
|
||||||
gpr.BindCRToRegister(field, true);
|
gpr.BindCRToRegister(field, true);
|
||||||
XB = gpr.CR(field);
|
ARM64Reg CR = gpr.CR(field);
|
||||||
|
|
||||||
if (bit != PowerPC::CR_GT_BIT)
|
if (bit != PowerPC::CR_GT_BIT)
|
||||||
FixGTBeforeSettingCRFieldBit(XB);
|
FixGTBeforeSettingCRFieldBit(CR);
|
||||||
|
|
||||||
switch (bit)
|
switch (bit)
|
||||||
{
|
{
|
||||||
case PowerPC::CR_SO_BIT: // set bit 59 to input
|
case PowerPC::CR_SO_BIT: // set bit 59 to input
|
||||||
BFI(XB, XA, PowerPC::CR_EMU_SO_BIT, 1);
|
BFI(CR, XA, PowerPC::CR_EMU_SO_BIT, 1);
|
||||||
break;
|
break;
|
||||||
|
|
||||||
case PowerPC::CR_EQ_BIT: // clear low 32 bits, set bit 0 to !input
|
case PowerPC::CR_EQ_BIT: // clear low 32 bits, set bit 0 to !input
|
||||||
AND(XB, XB, LogicalImm(0xFFFF'FFFF'0000'0000, GPRSize::B64));
|
AND(CR, CR, LogicalImm(0xFFFF'FFFF'0000'0000, GPRSize::B64));
|
||||||
EOR(XA, XA, LogicalImm(1, GPRSize::B64));
|
EOR(XA, XA, LogicalImm(1, GPRSize::B64));
|
||||||
ORR(XB, XB, XA);
|
ORR(CR, CR, XA);
|
||||||
break;
|
break;
|
||||||
|
|
||||||
case PowerPC::CR_GT_BIT: // set bit 63 to !input
|
case PowerPC::CR_GT_BIT: // set bit 63 to !input
|
||||||
EOR(XA, XA, LogicalImm(1, GPRSize::B64));
|
EOR(XA, XA, LogicalImm(1, GPRSize::B64));
|
||||||
BFI(XB, XA, 63, 1);
|
BFI(CR, XA, 63, 1);
|
||||||
break;
|
break;
|
||||||
|
|
||||||
case PowerPC::CR_LT_BIT: // set bit 62 to input
|
case PowerPC::CR_LT_BIT: // set bit 62 to input
|
||||||
BFI(XB, XA, PowerPC::CR_EMU_LT_BIT, 1);
|
BFI(CR, XA, PowerPC::CR_EMU_LT_BIT, 1);
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
ORR(XB, XB, LogicalImm(1ULL << 32, GPRSize::B64));
|
ORR(CR, CR, LogicalImm(1ULL << 32, GPRSize::B64));
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::mfcr(UGeckoInstruction inst)
|
void JitArm64::mfcr(UGeckoInstruction inst)
|
||||||
@ -670,8 +650,8 @@ void JitArm64::mfcr(UGeckoInstruction inst)
|
|||||||
|
|
||||||
gpr.BindToRegister(inst.RD, false);
|
gpr.BindToRegister(inst.RD, false);
|
||||||
ARM64Reg WA = gpr.R(inst.RD);
|
ARM64Reg WA = gpr.R(inst.RD);
|
||||||
ARM64Reg WB = gpr.GetReg();
|
auto WB = gpr.GetScopedReg();
|
||||||
ARM64Reg WC = gpr.GetReg();
|
auto WC = gpr.GetScopedReg();
|
||||||
ARM64Reg XA = EncodeRegTo64(WA);
|
ARM64Reg XA = EncodeRegTo64(WA);
|
||||||
ARM64Reg XB = EncodeRegTo64(WB);
|
ARM64Reg XB = EncodeRegTo64(WB);
|
||||||
ARM64Reg XC = EncodeRegTo64(WC);
|
ARM64Reg XC = EncodeRegTo64(WC);
|
||||||
@ -716,8 +696,6 @@ void JitArm64::mfcr(UGeckoInstruction inst)
|
|||||||
else if (!js.op->crInUse[i])
|
else if (!js.op->crInUse[i])
|
||||||
gpr.StoreCRRegisters(BitSet8{i}, WC);
|
gpr.StoreCRRegisters(BitSet8{i}, WC);
|
||||||
}
|
}
|
||||||
|
|
||||||
gpr.Unlock(WB, WC);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::mtcrf(UGeckoInstruction inst)
|
void JitArm64::mtcrf(UGeckoInstruction inst)
|
||||||
@ -729,7 +707,7 @@ void JitArm64::mtcrf(UGeckoInstruction inst)
|
|||||||
if (crm != 0)
|
if (crm != 0)
|
||||||
{
|
{
|
||||||
ARM64Reg RS = gpr.R(inst.RS);
|
ARM64Reg RS = gpr.R(inst.RS);
|
||||||
ARM64Reg WB = gpr.GetReg();
|
auto WB = gpr.GetScopedReg();
|
||||||
ARM64Reg XB = EncodeRegTo64(WB);
|
ARM64Reg XB = EncodeRegTo64(WB);
|
||||||
MOVP2R(XB, PowerPC::ConditionRegister::s_crTable.data());
|
MOVP2R(XB, PowerPC::ConditionRegister::s_crTable.data());
|
||||||
for (int i = 0; i < 8; ++i)
|
for (int i = 0; i < 8; ++i)
|
||||||
@ -753,7 +731,6 @@ void JitArm64::mtcrf(UGeckoInstruction inst)
|
|||||||
LDR(CR, XB, ArithOption(CR, true));
|
LDR(CR, XB, ArithOption(CR, true));
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
gpr.Unlock(WB);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -771,7 +748,7 @@ void JitArm64::mcrfs(UGeckoInstruction inst)
|
|||||||
|
|
||||||
gpr.BindCRToRegister(field, false);
|
gpr.BindCRToRegister(field, false);
|
||||||
ARM64Reg CR = gpr.CR(field);
|
ARM64Reg CR = gpr.CR(field);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg WCR = EncodeRegTo32(CR);
|
ARM64Reg WCR = EncodeRegTo32(CR);
|
||||||
ARM64Reg XA = EncodeRegTo64(WA);
|
ARM64Reg XA = EncodeRegTo64(WA);
|
||||||
|
|
||||||
@ -789,8 +766,6 @@ void JitArm64::mcrfs(UGeckoInstruction inst)
|
|||||||
|
|
||||||
MOVP2R(XA, PowerPC::ConditionRegister::s_crTable.data());
|
MOVP2R(XA, PowerPC::ConditionRegister::s_crTable.data());
|
||||||
LDR(CR, XA, ArithOption(CR, true));
|
LDR(CR, XA, ArithOption(CR, true));
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::mffsx(UGeckoInstruction inst)
|
void JitArm64::mffsx(UGeckoInstruction inst)
|
||||||
@ -799,7 +774,7 @@ void JitArm64::mffsx(UGeckoInstruction inst)
|
|||||||
JITDISABLE(bJITSystemRegistersOff);
|
JITDISABLE(bJITSystemRegistersOff);
|
||||||
FALLBACK_IF(inst.Rc);
|
FALLBACK_IF(inst.Rc);
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg XA = EncodeRegTo64(WA);
|
ARM64Reg XA = EncodeRegTo64(WA);
|
||||||
|
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
@ -808,8 +783,6 @@ void JitArm64::mffsx(UGeckoInstruction inst)
|
|||||||
|
|
||||||
ORR(XA, XA, LogicalImm(0xFFF8'0000'0000'0000, GPRSize::B64));
|
ORR(XA, XA, LogicalImm(0xFFF8'0000'0000'0000, GPRSize::B64));
|
||||||
m_float_emit.FMOV(EncodeRegToDouble(VD), XA);
|
m_float_emit.FMOV(EncodeRegToDouble(VD), XA);
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void JitArm64::mtfsb0x(UGeckoInstruction inst)
|
void JitArm64::mtfsb0x(UGeckoInstruction inst)
|
||||||
@ -824,7 +797,8 @@ void JitArm64::mtfsb0x(UGeckoInstruction inst)
|
|||||||
if (mask == FPSCR_FEX || mask == FPSCR_VX)
|
if (mask == FPSCR_FEX || mask == FPSCR_VX)
|
||||||
return;
|
return;
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
{
|
||||||
|
auto WA = gpr.GetScopedReg();
|
||||||
|
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
|
|
||||||
@ -833,8 +807,7 @@ void JitArm64::mtfsb0x(UGeckoInstruction inst)
|
|||||||
if ((mask & (FPSCR_ANY_X | FPSCR_ANY_E)) != 0)
|
if ((mask & (FPSCR_ANY_X | FPSCR_ANY_E)) != 0)
|
||||||
UpdateFPExceptionSummary(WA);
|
UpdateFPExceptionSummary(WA);
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
|
}
|
||||||
gpr.Unlock(WA);
|
|
||||||
|
|
||||||
if (inst.CRBD >= 29)
|
if (inst.CRBD >= 29)
|
||||||
UpdateRoundingMode();
|
UpdateRoundingMode();
|
||||||
@ -852,25 +825,24 @@ void JitArm64::mtfsb1x(UGeckoInstruction inst)
|
|||||||
if (mask == FPSCR_FEX || mask == FPSCR_VX)
|
if (mask == FPSCR_FEX || mask == FPSCR_VX)
|
||||||
return;
|
return;
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
{
|
||||||
|
auto WA = gpr.GetScopedReg();
|
||||||
|
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
|
|
||||||
if ((mask & FPSCR_ANY_X) != 0)
|
if ((mask & FPSCR_ANY_X) != 0)
|
||||||
{
|
{
|
||||||
ARM64Reg WB = gpr.GetReg();
|
auto WB = gpr.GetScopedReg();
|
||||||
TST(WA, LogicalImm(mask, GPRSize::B32));
|
TST(WA, LogicalImm(mask, GPRSize::B32));
|
||||||
ORR(WB, WA, LogicalImm(1 << 31, GPRSize::B32));
|
ORR(WB, WA, LogicalImm(1 << 31, GPRSize::B32));
|
||||||
CSEL(WA, WA, WB, CCFlags::CC_NEQ);
|
CSEL(WA, WA, WB, CCFlags::CC_NEQ);
|
||||||
gpr.Unlock(WB);
|
|
||||||
}
|
}
|
||||||
ORR(WA, WA, LogicalImm(mask, GPRSize::B32));
|
ORR(WA, WA, LogicalImm(mask, GPRSize::B32));
|
||||||
|
|
||||||
if ((mask & (FPSCR_ANY_X | FPSCR_ANY_E)) != 0)
|
if ((mask & (FPSCR_ANY_X | FPSCR_ANY_E)) != 0)
|
||||||
UpdateFPExceptionSummary(WA);
|
UpdateFPExceptionSummary(WA);
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
|
}
|
||||||
gpr.Unlock(WA);
|
|
||||||
|
|
||||||
if (inst.CRBD >= 29)
|
if (inst.CRBD >= 29)
|
||||||
UpdateRoundingMode();
|
UpdateRoundingMode();
|
||||||
@ -887,7 +859,8 @@ void JitArm64::mtfsfix(UGeckoInstruction inst)
|
|||||||
u8 shift = 28 - 4 * inst.CRFD;
|
u8 shift = 28 - 4 * inst.CRFD;
|
||||||
u32 mask = 0xF << shift;
|
u32 mask = 0xF << shift;
|
||||||
|
|
||||||
ARM64Reg WA = gpr.GetReg();
|
{
|
||||||
|
auto WA = gpr.GetScopedReg();
|
||||||
|
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
|
|
||||||
@ -902,17 +875,15 @@ void JitArm64::mtfsfix(UGeckoInstruction inst)
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
ARM64Reg WB = gpr.GetReg();
|
auto WB = gpr.GetScopedReg();
|
||||||
MOVZ(WB, imm);
|
MOVZ(WB, imm);
|
||||||
BFI(WA, WB, shift, 4);
|
BFI(WA, WB, shift, 4);
|
||||||
gpr.Unlock(WB);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if ((mask & (FPSCR_FEX | FPSCR_VX | FPSCR_ANY_X | FPSCR_ANY_E)) != 0)
|
if ((mask & (FPSCR_FEX | FPSCR_VX | FPSCR_ANY_X | FPSCR_ANY_E)) != 0)
|
||||||
UpdateFPExceptionSummary(WA);
|
UpdateFPExceptionSummary(WA);
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
|
}
|
||||||
gpr.Unlock(WA);
|
|
||||||
|
|
||||||
// Field 7 contains NI and RN.
|
// Field 7 contains NI and RN.
|
||||||
if (inst.CRFD == 7)
|
if (inst.CRFD == 7)
|
||||||
@ -936,20 +907,19 @@ void JitArm64::mtfsfx(UGeckoInstruction inst)
|
|||||||
if (mask == 0xFFFFFFFF)
|
if (mask == 0xFFFFFFFF)
|
||||||
{
|
{
|
||||||
ARM64Reg VB = fpr.R(inst.FB, RegType::LowerPair);
|
ARM64Reg VB = fpr.R(inst.FB, RegType::LowerPair);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
|
|
||||||
m_float_emit.FMOV(WA, EncodeRegToSingle(VB));
|
m_float_emit.FMOV(WA, EncodeRegToSingle(VB));
|
||||||
|
|
||||||
UpdateFPExceptionSummary(WA);
|
UpdateFPExceptionSummary(WA);
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
else if (mask != 0)
|
else if (mask != 0)
|
||||||
{
|
{
|
||||||
ARM64Reg VB = fpr.R(inst.FB, RegType::LowerPair);
|
ARM64Reg VB = fpr.R(inst.FB, RegType::LowerPair);
|
||||||
ARM64Reg WA = gpr.GetReg();
|
auto WA = gpr.GetScopedReg();
|
||||||
ARM64Reg WB = gpr.GetReg();
|
{
|
||||||
|
auto WB = gpr.GetScopedReg();
|
||||||
|
|
||||||
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
LDR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
m_float_emit.FMOV(WB, EncodeRegToSingle(VB));
|
m_float_emit.FMOV(WB, EncodeRegToSingle(VB));
|
||||||
@ -962,23 +932,18 @@ void JitArm64::mtfsfx(UGeckoInstruction inst)
|
|||||||
}
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
ARM64Reg WC = gpr.GetReg();
|
auto WC = gpr.GetScopedReg();
|
||||||
|
|
||||||
MOVI2R(WC, mask);
|
MOVI2R(WC, mask);
|
||||||
BIC(WA, WA, WC);
|
BIC(WA, WA, WC);
|
||||||
AND(WB, WB, WC);
|
AND(WB, WB, WC);
|
||||||
|
|
||||||
gpr.Unlock(WC);
|
|
||||||
}
|
}
|
||||||
ORR(WA, WA, WB);
|
ORR(WA, WA, WB);
|
||||||
|
}
|
||||||
gpr.Unlock(WB);
|
|
||||||
|
|
||||||
if ((mask & (FPSCR_FEX | FPSCR_VX | FPSCR_ANY_X | FPSCR_ANY_E)) != 0)
|
if ((mask & (FPSCR_FEX | FPSCR_VX | FPSCR_ANY_X | FPSCR_ANY_E)) != 0)
|
||||||
UpdateFPExceptionSummary(WA);
|
UpdateFPExceptionSummary(WA);
|
||||||
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
STR(IndexType::Unsigned, WA, PPC_REG, PPCSTATE_OFF(fpscr));
|
||||||
|
|
||||||
gpr.Unlock(WA);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
if (inst.FM & 1)
|
if (inst.FM & 1)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user