cdb240f3d4
[REUSE] is a specification that aims at making file copyright information consistent, so that it can be both human and machine readable. It basically requires that all files have a header containing copyright and licensing information. When this isn't possible, like when dealing with binary assets, generated files or embedded third-party dependencies, it is permitted to insert copyright information in the `.reuse/dep5` file. Oh, and it also requires that all the licenses used in the project are present in the `LICENSES` folder, that's why the diff is so huge. This can be done automatically with `reuse download --all`. The `reuse` tool also contains a handy subcommand that analyzes the project and tells whether or not the project is (still) compliant, `reuse lint`. Following REUSE has a few advantages over the current approach: - Copyright information is easy to access for users / downstream - Files like `dist/license.md` do not need to exist anymore, as `.reuse/dep5` is used instead - `reuse lint` makes it easy to ensure that copyright information of files like binary assets / images is always accurate and up to date To add copyright information of files that didn't have it I looked up who committed what and when, for each file. As yuzu contributors do not have to sign a CLA or similar I couldn't assume that copyright ownership was of the "yuzu Emulator Project", so I used the name and/or email of the commit author instead. [REUSE]: https://reuse.software Follow-up to 01cf05bc75b1e47beb08937439f3ed9339e7b254
229 lines
6.4 KiB
C++
229 lines
6.4 KiB
C++
// SPDX-FileCopyrightText: 2016 Citra Emulator Project
|
|
// SPDX-License-Identifier: GPL-2.0-or-later
|
|
|
|
#pragma once
|
|
|
|
#include <bitset>
|
|
#include <initializer_list>
|
|
#include <xbyak/xbyak.h>
|
|
#include "common/assert.h"
|
|
|
|
namespace Common::X64 {
|
|
|
|
constexpr size_t RegToIndex(const Xbyak::Reg& reg) {
|
|
using Kind = Xbyak::Reg::Kind;
|
|
ASSERT_MSG((reg.getKind() & (Kind::REG | Kind::XMM)) != 0,
|
|
"RegSet only support GPRs and XMM registers.");
|
|
ASSERT_MSG(reg.getIdx() < 16, "RegSet only supports XXM0-15.");
|
|
return static_cast<size_t>(reg.getIdx()) + (reg.getKind() == Kind::REG ? 0 : 16);
|
|
}
|
|
|
|
constexpr Xbyak::Reg64 IndexToReg64(size_t reg_index) {
|
|
ASSERT(reg_index < 16);
|
|
return Xbyak::Reg64(static_cast<int>(reg_index));
|
|
}
|
|
|
|
constexpr Xbyak::Xmm IndexToXmm(size_t reg_index) {
|
|
ASSERT(reg_index >= 16 && reg_index < 32);
|
|
return Xbyak::Xmm(static_cast<int>(reg_index - 16));
|
|
}
|
|
|
|
constexpr Xbyak::Reg IndexToReg(size_t reg_index) {
|
|
if (reg_index < 16) {
|
|
return IndexToReg64(reg_index);
|
|
} else {
|
|
return IndexToXmm(reg_index);
|
|
}
|
|
}
|
|
|
|
constexpr std::bitset<32> BuildRegSet(std::initializer_list<Xbyak::Reg> regs) {
|
|
size_t bits = 0;
|
|
for (const Xbyak::Reg& reg : regs) {
|
|
bits |= size_t{1} << RegToIndex(reg);
|
|
}
|
|
return {bits};
|
|
}
|
|
|
|
constexpr inline std::bitset<32> ABI_ALL_GPRS(0x0000FFFF);
|
|
constexpr inline std::bitset<32> ABI_ALL_XMMS(0xFFFF0000);
|
|
|
|
#ifdef _WIN32
|
|
|
|
// Microsoft x64 ABI
|
|
constexpr inline Xbyak::Reg ABI_RETURN = Xbyak::util::rax;
|
|
constexpr inline Xbyak::Reg ABI_PARAM1 = Xbyak::util::rcx;
|
|
constexpr inline Xbyak::Reg ABI_PARAM2 = Xbyak::util::rdx;
|
|
constexpr inline Xbyak::Reg ABI_PARAM3 = Xbyak::util::r8;
|
|
constexpr inline Xbyak::Reg ABI_PARAM4 = Xbyak::util::r9;
|
|
|
|
constexpr inline std::bitset<32> ABI_ALL_CALLER_SAVED = BuildRegSet({
|
|
// GPRs
|
|
Xbyak::util::rcx,
|
|
Xbyak::util::rdx,
|
|
Xbyak::util::r8,
|
|
Xbyak::util::r9,
|
|
Xbyak::util::r10,
|
|
Xbyak::util::r11,
|
|
// XMMs
|
|
Xbyak::util::xmm0,
|
|
Xbyak::util::xmm1,
|
|
Xbyak::util::xmm2,
|
|
Xbyak::util::xmm3,
|
|
Xbyak::util::xmm4,
|
|
Xbyak::util::xmm5,
|
|
});
|
|
|
|
constexpr inline std::bitset<32> ABI_ALL_CALLEE_SAVED = BuildRegSet({
|
|
// GPRs
|
|
Xbyak::util::rbx,
|
|
Xbyak::util::rsi,
|
|
Xbyak::util::rdi,
|
|
Xbyak::util::rbp,
|
|
Xbyak::util::r12,
|
|
Xbyak::util::r13,
|
|
Xbyak::util::r14,
|
|
Xbyak::util::r15,
|
|
// XMMs
|
|
Xbyak::util::xmm6,
|
|
Xbyak::util::xmm7,
|
|
Xbyak::util::xmm8,
|
|
Xbyak::util::xmm9,
|
|
Xbyak::util::xmm10,
|
|
Xbyak::util::xmm11,
|
|
Xbyak::util::xmm12,
|
|
Xbyak::util::xmm13,
|
|
Xbyak::util::xmm14,
|
|
Xbyak::util::xmm15,
|
|
});
|
|
|
|
constexpr size_t ABI_SHADOW_SPACE = 0x20;
|
|
|
|
#else
|
|
|
|
// System V x86-64 ABI
|
|
constexpr inline Xbyak::Reg ABI_RETURN = Xbyak::util::rax;
|
|
constexpr inline Xbyak::Reg ABI_PARAM1 = Xbyak::util::rdi;
|
|
constexpr inline Xbyak::Reg ABI_PARAM2 = Xbyak::util::rsi;
|
|
constexpr inline Xbyak::Reg ABI_PARAM3 = Xbyak::util::rdx;
|
|
constexpr inline Xbyak::Reg ABI_PARAM4 = Xbyak::util::rcx;
|
|
|
|
constexpr inline std::bitset<32> ABI_ALL_CALLER_SAVED = BuildRegSet({
|
|
// GPRs
|
|
Xbyak::util::rcx,
|
|
Xbyak::util::rdx,
|
|
Xbyak::util::rdi,
|
|
Xbyak::util::rsi,
|
|
Xbyak::util::r8,
|
|
Xbyak::util::r9,
|
|
Xbyak::util::r10,
|
|
Xbyak::util::r11,
|
|
// XMMs
|
|
Xbyak::util::xmm0,
|
|
Xbyak::util::xmm1,
|
|
Xbyak::util::xmm2,
|
|
Xbyak::util::xmm3,
|
|
Xbyak::util::xmm4,
|
|
Xbyak::util::xmm5,
|
|
Xbyak::util::xmm6,
|
|
Xbyak::util::xmm7,
|
|
Xbyak::util::xmm8,
|
|
Xbyak::util::xmm9,
|
|
Xbyak::util::xmm10,
|
|
Xbyak::util::xmm11,
|
|
Xbyak::util::xmm12,
|
|
Xbyak::util::xmm13,
|
|
Xbyak::util::xmm14,
|
|
Xbyak::util::xmm15,
|
|
});
|
|
|
|
constexpr inline std::bitset<32> ABI_ALL_CALLEE_SAVED = BuildRegSet({
|
|
// GPRs
|
|
Xbyak::util::rbx,
|
|
Xbyak::util::rbp,
|
|
Xbyak::util::r12,
|
|
Xbyak::util::r13,
|
|
Xbyak::util::r14,
|
|
Xbyak::util::r15,
|
|
});
|
|
|
|
constexpr size_t ABI_SHADOW_SPACE = 0;
|
|
|
|
#endif
|
|
|
|
struct ABIFrameInfo {
|
|
s32 subtraction;
|
|
s32 xmm_offset;
|
|
};
|
|
|
|
inline ABIFrameInfo ABI_CalculateFrameSize(std::bitset<32> regs, size_t rsp_alignment,
|
|
size_t needed_frame_size) {
|
|
const auto count = (regs & ABI_ALL_GPRS).count();
|
|
rsp_alignment -= count * 8;
|
|
size_t subtraction = 0;
|
|
const auto xmm_count = (regs & ABI_ALL_XMMS).count();
|
|
if (xmm_count) {
|
|
// If we have any XMMs to save, we must align the stack here.
|
|
subtraction = rsp_alignment & 0xF;
|
|
}
|
|
subtraction += 0x10 * xmm_count;
|
|
size_t xmm_base_subtraction = subtraction;
|
|
subtraction += needed_frame_size;
|
|
subtraction += ABI_SHADOW_SPACE;
|
|
// Final alignment.
|
|
rsp_alignment -= subtraction;
|
|
subtraction += rsp_alignment & 0xF;
|
|
|
|
return ABIFrameInfo{static_cast<s32>(subtraction),
|
|
static_cast<s32>(subtraction - xmm_base_subtraction)};
|
|
}
|
|
|
|
inline size_t ABI_PushRegistersAndAdjustStack(Xbyak::CodeGenerator& code, std::bitset<32> regs,
|
|
size_t rsp_alignment, size_t needed_frame_size = 0) {
|
|
auto frame_info = ABI_CalculateFrameSize(regs, rsp_alignment, needed_frame_size);
|
|
|
|
for (size_t i = 0; i < regs.size(); ++i) {
|
|
if (regs[i] && ABI_ALL_GPRS[i]) {
|
|
code.push(IndexToReg64(i));
|
|
}
|
|
}
|
|
|
|
if (frame_info.subtraction != 0) {
|
|
code.sub(code.rsp, frame_info.subtraction);
|
|
}
|
|
|
|
for (size_t i = 0; i < regs.size(); ++i) {
|
|
if (regs[i] && ABI_ALL_XMMS[i]) {
|
|
code.movaps(code.xword[code.rsp + frame_info.xmm_offset], IndexToXmm(i));
|
|
frame_info.xmm_offset += 0x10;
|
|
}
|
|
}
|
|
|
|
return ABI_SHADOW_SPACE;
|
|
}
|
|
|
|
inline void ABI_PopRegistersAndAdjustStack(Xbyak::CodeGenerator& code, std::bitset<32> regs,
|
|
size_t rsp_alignment, size_t needed_frame_size = 0) {
|
|
auto frame_info = ABI_CalculateFrameSize(regs, rsp_alignment, needed_frame_size);
|
|
|
|
for (size_t i = 0; i < regs.size(); ++i) {
|
|
if (regs[i] && ABI_ALL_XMMS[i]) {
|
|
code.movaps(IndexToXmm(i), code.xword[code.rsp + frame_info.xmm_offset]);
|
|
frame_info.xmm_offset += 0x10;
|
|
}
|
|
}
|
|
|
|
if (frame_info.subtraction != 0) {
|
|
code.add(code.rsp, frame_info.subtraction);
|
|
}
|
|
|
|
// GPRs need to be popped in reverse order
|
|
for (size_t j = 0; j < regs.size(); ++j) {
|
|
const size_t i = regs.size() - j - 1;
|
|
if (regs[i] && ABI_ALL_GPRS[i]) {
|
|
code.pop(IndexToReg64(i));
|
|
}
|
|
}
|
|
}
|
|
|
|
} // namespace Common::X64
|