e2358af5ef
Smaller codesize.
153 lines
5.1 KiB
C++
153 lines
5.1 KiB
C++
// Copyright (C) 2003 Dolphin Project.
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU General Public License as published by
|
|
// the Free Software Foundation, version 2.0 or later versions.
|
|
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU General Public License 2.0 for more details.
|
|
|
|
// A copy of the GPL 2.0 should have been included with the program.
|
|
// If not, see http://www.gnu.org/licenses/
|
|
|
|
// 24th August 2016: This code was modified for Dynarmic.
|
|
|
|
#include <algorithm>
|
|
#include <vector>
|
|
|
|
#include <xbyak.h>
|
|
|
|
#include "backend/x64/abi.h"
|
|
#include "backend/x64/block_of_code.h"
|
|
#include "common/common_types.h"
|
|
#include "common/iterator_util.h"
|
|
|
|
namespace Dynarmic::BackendX64 {
|
|
|
|
constexpr size_t GPR_SIZE = 8;
|
|
constexpr size_t XMM_SIZE = 16;
|
|
|
|
struct FrameInfo {
|
|
size_t stack_subtraction = 0;
|
|
size_t xmm_offset = 0;
|
|
};
|
|
|
|
static FrameInfo CalculateFrameInfo(size_t num_gprs, size_t num_xmms, size_t frame_size) {
|
|
FrameInfo frame_info = {};
|
|
|
|
size_t rsp_alignment = 8; // We are always 8-byte aligned initially
|
|
rsp_alignment -= num_gprs * GPR_SIZE;
|
|
|
|
if (num_xmms > 0) {
|
|
frame_info.stack_subtraction = rsp_alignment & 0xF;
|
|
frame_info.stack_subtraction += num_xmms * XMM_SIZE;
|
|
}
|
|
|
|
size_t xmm_base = frame_info.stack_subtraction;
|
|
|
|
frame_info.stack_subtraction += frame_size;
|
|
frame_info.stack_subtraction += ABI_SHADOW_SPACE;
|
|
|
|
rsp_alignment -= frame_info.stack_subtraction;
|
|
frame_info.stack_subtraction += rsp_alignment & 0xF;
|
|
|
|
frame_info.xmm_offset = frame_info.stack_subtraction - xmm_base;
|
|
|
|
return frame_info;
|
|
}
|
|
|
|
template<typename RegisterArrayT>
|
|
void ABI_PushRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size, const RegisterArrayT& regs) {
|
|
using namespace Xbyak::util;
|
|
|
|
const size_t num_gprs = std::count_if(regs.begin(), regs.end(), HostLocIsGPR);
|
|
const size_t num_xmms = std::count_if(regs.begin(), regs.end(), HostLocIsXMM);
|
|
|
|
FrameInfo frame_info = CalculateFrameInfo(num_gprs, num_xmms, frame_size);
|
|
|
|
for (HostLoc gpr : regs) {
|
|
if (HostLocIsGPR(gpr)) {
|
|
code.push(HostLocToReg64(gpr));
|
|
}
|
|
}
|
|
|
|
if (frame_info.stack_subtraction != 0) {
|
|
code.sub(rsp, u32(frame_info.stack_subtraction));
|
|
}
|
|
|
|
size_t xmm_offset = frame_info.xmm_offset;
|
|
for (HostLoc xmm : regs) {
|
|
if (HostLocIsXMM(xmm)) {
|
|
if (code.DoesCpuSupport(Xbyak::util::Cpu::tAVX)) {
|
|
code.vmovaps(code.xword[rsp + xmm_offset], HostLocToXmm(xmm));
|
|
} else {
|
|
code.movaps(code.xword[rsp + xmm_offset], HostLocToXmm(xmm));
|
|
}
|
|
xmm_offset += XMM_SIZE;
|
|
}
|
|
}
|
|
}
|
|
|
|
template<typename RegisterArrayT>
|
|
void ABI_PopRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size, const RegisterArrayT& regs) {
|
|
using namespace Xbyak::util;
|
|
|
|
const size_t num_gprs = std::count_if(regs.begin(), regs.end(), HostLocIsGPR);
|
|
const size_t num_xmms = std::count_if(regs.begin(), regs.end(), HostLocIsXMM);
|
|
|
|
FrameInfo frame_info = CalculateFrameInfo(num_gprs, num_xmms, frame_size);
|
|
|
|
size_t xmm_offset = frame_info.xmm_offset;
|
|
for (HostLoc xmm : regs) {
|
|
if (HostLocIsXMM(xmm)) {
|
|
if (code.DoesCpuSupport(Xbyak::util::Cpu::tAVX)) {
|
|
code.vmovaps(HostLocToXmm(xmm), code.xword[rsp + xmm_offset]);
|
|
} else {
|
|
code.movaps(HostLocToXmm(xmm), code.xword[rsp + xmm_offset]);
|
|
}
|
|
xmm_offset += XMM_SIZE;
|
|
}
|
|
}
|
|
|
|
if (frame_info.stack_subtraction != 0) {
|
|
code.add(rsp, u32(frame_info.stack_subtraction));
|
|
}
|
|
|
|
for (HostLoc gpr : Common::Reverse(regs)) {
|
|
if (HostLocIsGPR(gpr)) {
|
|
code.pop(HostLocToReg64(gpr));
|
|
}
|
|
}
|
|
}
|
|
|
|
void ABI_PushCalleeSaveRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size) {
|
|
ABI_PushRegistersAndAdjustStack(code, frame_size, ABI_ALL_CALLEE_SAVE);
|
|
}
|
|
|
|
void ABI_PopCalleeSaveRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size) {
|
|
ABI_PopRegistersAndAdjustStack(code, frame_size, ABI_ALL_CALLEE_SAVE);
|
|
}
|
|
|
|
void ABI_PushCallerSaveRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size) {
|
|
ABI_PushRegistersAndAdjustStack(code, frame_size, ABI_ALL_CALLER_SAVE);
|
|
}
|
|
|
|
void ABI_PopCallerSaveRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size) {
|
|
ABI_PopRegistersAndAdjustStack(code, frame_size, ABI_ALL_CALLER_SAVE);
|
|
}
|
|
|
|
void ABI_PushCallerSaveRegistersAndAdjustStackExcept(BlockOfCode& code, HostLoc exception) {
|
|
std::vector<HostLoc> regs;
|
|
std::remove_copy(ABI_ALL_CALLER_SAVE.begin(), ABI_ALL_CALLER_SAVE.end(), std::back_inserter(regs), exception);
|
|
ABI_PushRegistersAndAdjustStack(code, 0, regs);
|
|
}
|
|
|
|
void ABI_PopCallerSaveRegistersAndAdjustStackExcept(BlockOfCode& code, HostLoc exception) {
|
|
std::vector<HostLoc> regs;
|
|
std::remove_copy(ABI_ALL_CALLER_SAVE.begin(), ABI_ALL_CALLER_SAVE.end(), std::back_inserter(regs), exception);
|
|
ABI_PopRegistersAndAdjustStack(code, 0, regs);
|
|
}
|
|
|
|
} // namespace Dynarmic::BackendX64
|