emit_arm64_a32: Improve A32SetCpsr
This commit is contained in:
parent
ad6a04c584
commit
97edb626c7
1 changed files with 43 additions and 9 deletions
|
@ -311,20 +311,54 @@ void EmitIR<IR::Opcode::A32GetCpsr>(oaknut::CodeGenerator& code, EmitContext& ct
|
||||||
code.ORR(Wcpsr, Wcpsr, Wscratch0, LSL, 5);
|
code.ORR(Wcpsr, Wcpsr, Wscratch0, LSL, 5);
|
||||||
}
|
}
|
||||||
|
|
||||||
static void SetCpsrImpl(u32 value, A32JitState* jit_state) {
|
|
||||||
jit_state->SetCpsr(value);
|
|
||||||
}
|
|
||||||
|
|
||||||
template<>
|
template<>
|
||||||
void EmitIR<IR::Opcode::A32SetCpsr>(oaknut::CodeGenerator& code, EmitContext& ctx, IR::Inst* inst) {
|
void EmitIR<IR::Opcode::A32SetCpsr>(oaknut::CodeGenerator& code, EmitContext& ctx, IR::Inst* inst) {
|
||||||
auto args = ctx.reg_alloc.GetArgumentInfo(inst);
|
auto args = ctx.reg_alloc.GetArgumentInfo(inst);
|
||||||
ctx.reg_alloc.PrepareForCall(nullptr, args[0]);
|
auto Wcpsr = ctx.reg_alloc.ReadW(args[0]);
|
||||||
|
RegAlloc::Realize(Wcpsr);
|
||||||
|
|
||||||
// TODO: Inline
|
// NZCV, Q flags
|
||||||
|
code.AND(Wscratch0, Wcpsr, 0xF0000000);
|
||||||
|
code.AND(Wscratch1, Wcpsr, 1 << 27);
|
||||||
|
|
||||||
code.MOV(X1, Xstate);
|
static_assert(offsetof(A32JitState, cpsr_nzcv) + sizeof(u32) == offsetof(A32JitState, cpsr_q));
|
||||||
code.MOV(Xscratch0, reinterpret_cast<u64>(&SetCpsrImpl));
|
code.STP(Wscratch0, Wscratch1, Xstate, offsetof(A32JitState, cpsr_nzcv));
|
||||||
code.BLR(Xscratch0);
|
|
||||||
|
// GE flags
|
||||||
|
// this does the following:
|
||||||
|
// cpsr_ge |= mcl::bit::get_bit<19>(cpsr) ? 0xFF000000 : 0;
|
||||||
|
// cpsr_ge |= mcl::bit::get_bit<18>(cpsr) ? 0x00FF0000 : 0;
|
||||||
|
// cpsr_ge |= mcl::bit::get_bit<17>(cpsr) ? 0x0000FF00 : 0;
|
||||||
|
// cpsr_ge |= mcl::bit::get_bit<16>(cpsr) ? 0x000000FF : 0;
|
||||||
|
code.UBFX(Wscratch0, Wcpsr, 16, 4);
|
||||||
|
code.MOV(Wscratch1, 0x00204081);
|
||||||
|
code.MUL(Wscratch0, Wscratch0, Wscratch1);
|
||||||
|
code.AND(Wscratch0, Wscratch0, 0x01010101);
|
||||||
|
code.LSL(Wscratch1, Wscratch0, 8);
|
||||||
|
code.SUB(Wscratch0, Wscratch1, Wscratch0);
|
||||||
|
|
||||||
|
// Other flags
|
||||||
|
code.MOV(Wscratch1, 0x010001DF);
|
||||||
|
code.AND(Wscratch1, Wcpsr, Wscratch1);
|
||||||
|
|
||||||
|
static_assert(offsetof(A32JitState, cpsr_jaifm) + sizeof(u32) == offsetof(A32JitState, cpsr_ge));
|
||||||
|
code.STP(Wscratch1, Wscratch0, Xstate, offsetof(A32JitState, cpsr_jaifm));
|
||||||
|
|
||||||
|
// IT state
|
||||||
|
code.AND(Wscratch0, Wcpsr, 0xFC00);
|
||||||
|
code.LSR(Wscratch1, Wcpsr, 17);
|
||||||
|
code.AND(Wscratch1, Wscratch1, 0x300);
|
||||||
|
code.ORR(Wscratch0, Wscratch0, Wscratch1);
|
||||||
|
|
||||||
|
// E flag, T flag
|
||||||
|
code.LSR(Wscratch1, Wcpsr, 8);
|
||||||
|
code.AND(Wscratch1, Wscratch1, 0x2);
|
||||||
|
code.ORR(Wscratch0, Wscratch0, Wscratch1);
|
||||||
|
code.LDR(Wscratch1, Xstate, offsetof(A32JitState, upper_location_descriptor));
|
||||||
|
code.BFXIL(Wscratch0, Wcpsr, 5, 1);
|
||||||
|
code.AND(Wscratch1, Wscratch1, 0xFFFF0000);
|
||||||
|
code.ORR(Wscratch0, Wscratch0, Wscratch1);
|
||||||
|
code.STR(Wscratch0, Xstate, offsetof(A32JitState, upper_location_descriptor));
|
||||||
}
|
}
|
||||||
|
|
||||||
template<>
|
template<>
|
||||||
|
|
Loading…
Reference in a new issue