// Copyright (C) 2003 Dolphin Project. // This program is free software: you can redistribute it and/or modify // it under the terms of the GNU General Public License as published by // the Free Software Foundation, version 2.0 or later versions. // This program is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU General Public License 2.0 for more details. // A copy of the GPL 2.0 should have been included with the program. // If not, see http://www.gnu.org/licenses/ // 24th August 2016: This code was modified for Dynarmic. #include #include #include #include "backend/x64/abi.h" #include "backend/x64/block_of_code.h" #include "common/common_types.h" #include "common/iterator_util.h" namespace Dynarmic::BackendX64 { constexpr size_t GPR_SIZE = 8; constexpr size_t XMM_SIZE = 16; struct FrameInfo { size_t stack_subtraction = 0; size_t xmm_offset = 0; }; static FrameInfo CalculateFrameInfo(size_t num_gprs, size_t num_xmms, size_t frame_size) { FrameInfo frame_info = {}; size_t rsp_alignment = 8; // We are always 8-byte aligned initially rsp_alignment -= num_gprs * GPR_SIZE; if (num_xmms > 0) { frame_info.stack_subtraction = rsp_alignment & 0xF; frame_info.stack_subtraction += num_xmms * XMM_SIZE; } size_t xmm_base = frame_info.stack_subtraction; frame_info.stack_subtraction += frame_size; frame_info.stack_subtraction += ABI_SHADOW_SPACE; rsp_alignment -= frame_info.stack_subtraction; frame_info.stack_subtraction += rsp_alignment & 0xF; frame_info.xmm_offset = frame_info.stack_subtraction - xmm_base; return frame_info; } template void ABI_PushRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size, const RegisterArrayT& regs) { using namespace Xbyak::util; const size_t num_gprs = std::count_if(regs.begin(), regs.end(), HostLocIsGPR); const size_t num_xmms = std::count_if(regs.begin(), regs.end(), HostLocIsXMM); FrameInfo frame_info = CalculateFrameInfo(num_gprs, num_xmms, frame_size); for (HostLoc gpr : regs) { if (HostLocIsGPR(gpr)) { code.push(HostLocToReg64(gpr)); } } if (frame_info.stack_subtraction != 0) { code.sub(rsp, u32(frame_info.stack_subtraction)); } size_t xmm_offset = frame_info.xmm_offset; for (HostLoc xmm : regs) { if (HostLocIsXMM(xmm)) { if (code.DoesCpuSupport(Xbyak::util::Cpu::tAVX)) { code.vmovaps(code.xword[rsp + xmm_offset], HostLocToXmm(xmm)); } else { code.movaps(code.xword[rsp + xmm_offset], HostLocToXmm(xmm)); } xmm_offset += XMM_SIZE; } } } template void ABI_PopRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size, const RegisterArrayT& regs) { using namespace Xbyak::util; const size_t num_gprs = std::count_if(regs.begin(), regs.end(), HostLocIsGPR); const size_t num_xmms = std::count_if(regs.begin(), regs.end(), HostLocIsXMM); FrameInfo frame_info = CalculateFrameInfo(num_gprs, num_xmms, frame_size); size_t xmm_offset = frame_info.xmm_offset; for (HostLoc xmm : regs) { if (HostLocIsXMM(xmm)) { if (code.DoesCpuSupport(Xbyak::util::Cpu::tAVX)) { code.vmovaps(HostLocToXmm(xmm), code.xword[rsp + xmm_offset]); } else { code.movaps(HostLocToXmm(xmm), code.xword[rsp + xmm_offset]); } xmm_offset += XMM_SIZE; } } if (frame_info.stack_subtraction != 0) { code.add(rsp, u32(frame_info.stack_subtraction)); } for (HostLoc gpr : Common::Reverse(regs)) { if (HostLocIsGPR(gpr)) { code.pop(HostLocToReg64(gpr)); } } } void ABI_PushCalleeSaveRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size) { ABI_PushRegistersAndAdjustStack(code, frame_size, ABI_ALL_CALLEE_SAVE); } void ABI_PopCalleeSaveRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size) { ABI_PopRegistersAndAdjustStack(code, frame_size, ABI_ALL_CALLEE_SAVE); } void ABI_PushCallerSaveRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size) { ABI_PushRegistersAndAdjustStack(code, frame_size, ABI_ALL_CALLER_SAVE); } void ABI_PopCallerSaveRegistersAndAdjustStack(BlockOfCode& code, size_t frame_size) { ABI_PopRegistersAndAdjustStack(code, frame_size, ABI_ALL_CALLER_SAVE); } void ABI_PushCallerSaveRegistersAndAdjustStackExcept(BlockOfCode& code, HostLoc exception) { std::vector regs; std::remove_copy(ABI_ALL_CALLER_SAVE.begin(), ABI_ALL_CALLER_SAVE.end(), std::back_inserter(regs), exception); ABI_PushRegistersAndAdjustStack(code, 0, regs); } void ABI_PopCallerSaveRegistersAndAdjustStackExcept(BlockOfCode& code, HostLoc exception) { std::vector regs; std::remove_copy(ABI_ALL_CALLER_SAVE.begin(), ABI_ALL_CALLER_SAVE.end(), std::back_inserter(regs), exception); ABI_PopRegistersAndAdjustStack(code, 0, regs); } } // namespace Dynarmic::BackendX64