backend/arm64/reg_alloc: Add flag handling

This commit is contained in:
Merry 2022-07-19 17:18:29 +01:00 committed by merry
parent 77436bbbbb
commit 8e6467bf45
4 changed files with 105 additions and 48 deletions

View file

@ -48,11 +48,10 @@ void EmitIR<IR::Opcode::GetNZFromOp>(oaknut::CodeGenerator& code, EmitContext& c
auto args = ctx.reg_alloc.GetArgumentInfo(inst); auto args = ctx.reg_alloc.GetArgumentInfo(inst);
auto Wvalue = ctx.reg_alloc.ReadW(args[0]); auto Wvalue = ctx.reg_alloc.ReadW(args[0]);
auto Wnz = ctx.reg_alloc.WriteW(inst); auto flags = ctx.reg_alloc.WriteFlags(inst);
RegAlloc::Realize(Wvalue, Wnz); RegAlloc::Realize(Wvalue, flags);
code.CMP(*Wnz, WZR); code.CMP(*Wvalue, WZR);
code.MRS(Wnz->toX(), static_cast<oaknut::SystemReg>(0b11'011'0100'0010'000));
} }
EmittedBlockInfo EmitArm64(oaknut::CodeGenerator& code, IR::Block block, const EmitConfig& emit_conf) { EmittedBlockInfo EmitArm64(oaknut::CodeGenerator& code, IR::Block block, const EmitConfig& emit_conf) {

View file

@ -47,6 +47,7 @@ void EmitIR<IR::Opcode::LogicalShiftLeft32>(oaknut::CodeGenerator& code, EmitCon
auto Woperand = ctx.reg_alloc.ReadW(operand_arg); auto Woperand = ctx.reg_alloc.ReadW(operand_arg);
auto Wshift = ctx.reg_alloc.ReadW(shift_arg); auto Wshift = ctx.reg_alloc.ReadW(shift_arg);
RegAlloc::Realize(Wresult, Woperand, Wshift); RegAlloc::Realize(Wresult, Woperand, Wshift);
ctx.reg_alloc.SpillFlags();
code.AND(Wscratch0, Wshift, 0xff); code.AND(Wscratch0, Wshift, 0xff);
code.LSL(Wresult, Woperand, Wscratch0); code.LSL(Wresult, Woperand, Wscratch0);
@ -83,6 +84,7 @@ void EmitIR<IR::Opcode::LogicalShiftLeft32>(oaknut::CodeGenerator& code, EmitCon
auto Wshift = ctx.reg_alloc.ReadW(shift_arg); auto Wshift = ctx.reg_alloc.ReadW(shift_arg);
auto Wcarry_in = ctx.reg_alloc.ReadW(carry_arg); auto Wcarry_in = ctx.reg_alloc.ReadW(carry_arg);
RegAlloc::Realize(Wresult, Wcarry_out, Woperand, Wshift, Wcarry_in); RegAlloc::Realize(Wresult, Wcarry_out, Woperand, Wshift, Wcarry_in);
ctx.reg_alloc.SpillFlags();
// TODO: Use RMIF // TODO: Use RMIF

View file

@ -88,10 +88,8 @@ bool RegAlloc::IsValueLive(IR::Inst* inst) const {
return !!ValueLocation(inst); return !!ValueLocation(inst);
} }
template<bool is_vector> template<HostLoc::Kind required_kind>
int RegAlloc::RealizeReadImpl(const IR::Inst* value) { int RegAlloc::RealizeReadImpl(const IR::Inst* value) {
constexpr HostLoc::Kind required_kind = is_vector ? HostLoc::Kind::Fpr : HostLoc::Kind::Gpr;
const auto current_location = ValueLocation(value); const auto current_location = ValueLocation(value);
ASSERT(current_location); ASSERT(current_location);
@ -103,26 +101,7 @@ int RegAlloc::RealizeReadImpl(const IR::Inst* value) {
ASSERT(!ValueInfo(*current_location).realized); ASSERT(!ValueInfo(*current_location).realized);
ASSERT(ValueInfo(*current_location).locked); ASSERT(ValueInfo(*current_location).locked);
if constexpr (is_vector) { if constexpr (required_kind == HostLoc::Kind::Gpr) {
const int new_location_index = AllocateRegister(fprs, fpr_order);
SpillFpr(new_location_index);
switch (current_location->kind) {
case HostLoc::Kind::Gpr:
code.FMOV(oaknut::DReg{new_location_index}, oaknut::XReg{current_location->index});
break;
case HostLoc::Kind::Fpr:
ASSERT_FALSE("Logic error");
break;
case HostLoc::Kind::Spill:
code.LDR(oaknut::QReg{new_location_index}, SP, spill_offset + new_location_index * spill_slot_size);
break;
}
fprs[new_location_index] = std::exchange(ValueInfo(*current_location), {});
fprs[new_location_index].realized = true;
return new_location_index;
} else {
const int new_location_index = AllocateRegister(gprs, gpr_order); const int new_location_index = AllocateRegister(gprs, gpr_order);
SpillGpr(new_location_index); SpillGpr(new_location_index);
@ -137,15 +116,44 @@ int RegAlloc::RealizeReadImpl(const IR::Inst* value) {
case HostLoc::Kind::Spill: case HostLoc::Kind::Spill:
code.LDR(oaknut::XReg{new_location_index}, SP, spill_offset + new_location_index * spill_slot_size); code.LDR(oaknut::XReg{new_location_index}, SP, spill_offset + new_location_index * spill_slot_size);
break; break;
case HostLoc::Kind::Flags:
code.MRS(oaknut::XReg{new_location_index}, static_cast<oaknut::SystemReg>(0b11'011'0100'0010'000));
break;
} }
gprs[new_location_index] = std::exchange(ValueInfo(*current_location), {}); gprs[new_location_index] = std::exchange(ValueInfo(*current_location), {});
gprs[new_location_index].realized = true; gprs[new_location_index].realized = true;
return new_location_index; return new_location_index;
} else if constexpr (required_kind == HostLoc::Kind::Fpr) {
const int new_location_index = AllocateRegister(fprs, fpr_order);
SpillFpr(new_location_index);
switch (current_location->kind) {
case HostLoc::Kind::Gpr:
code.FMOV(oaknut::DReg{new_location_index}, oaknut::XReg{current_location->index});
break;
case HostLoc::Kind::Fpr:
ASSERT_FALSE("Logic error");
break;
case HostLoc::Kind::Spill:
code.LDR(oaknut::QReg{new_location_index}, SP, spill_offset + new_location_index * spill_slot_size);
break;
case HostLoc::Kind::Flags:
ASSERT_FALSE("Moving from flags into fprs is not currently supported");
break;
}
fprs[new_location_index] = std::exchange(ValueInfo(*current_location), {});
fprs[new_location_index].realized = true;
return new_location_index;
} else if constexpr (required_kind == HostLoc::Kind::Flags) {
ASSERT_FALSE("Loading flags back into NZCV is not currently supported");
} else {
static_assert(required_kind == HostLoc::Kind::Fpr || required_kind == HostLoc::Kind::Gpr || required_kind == HostLoc::Kind::Flags);
} }
} }
template<bool is_vector> template<HostLoc::Kind kind>
int RegAlloc::RealizeWriteImpl(const IR::Inst* value) { int RegAlloc::RealizeWriteImpl(const IR::Inst* value) {
ASSERT(!ValueLocation(value)); ASSERT(!ValueLocation(value));
@ -157,23 +165,31 @@ int RegAlloc::RealizeWriteImpl(const IR::Inst* value) {
info.expected_uses += value->UseCount(); info.expected_uses += value->UseCount();
}; };
if constexpr (is_vector) { if constexpr (kind == HostLoc::Kind::Gpr) {
const int new_location_index = AllocateRegister(fprs, fpr_order);
SpillFpr(new_location_index);
setup_location(fprs[new_location_index]);
return new_location_index;
} else {
const int new_location_index = AllocateRegister(gprs, gpr_order); const int new_location_index = AllocateRegister(gprs, gpr_order);
SpillGpr(new_location_index); SpillGpr(new_location_index);
setup_location(gprs[new_location_index]); setup_location(gprs[new_location_index]);
return new_location_index; return new_location_index;
} else if constexpr (kind == HostLoc::Kind::Fpr) {
const int new_location_index = AllocateRegister(fprs, fpr_order);
SpillFpr(new_location_index);
setup_location(fprs[new_location_index]);
return new_location_index;
} else if constexpr (kind == HostLoc::Kind::Flags) {
ASSERT(flags.values.empty());
setup_location(flags);
return 0;
} else {
static_assert(kind == HostLoc::Kind::Fpr || kind == HostLoc::Kind::Gpr || kind == HostLoc::Kind::Flags);
} }
} }
template int RegAlloc::RealizeReadImpl<true>(const IR::Inst* value); template int RegAlloc::RealizeReadImpl<HostLoc::Kind::Gpr>(const IR::Inst* value);
template int RegAlloc::RealizeReadImpl<false>(const IR::Inst* value); template int RegAlloc::RealizeReadImpl<HostLoc::Kind::Fpr>(const IR::Inst* value);
template int RegAlloc::RealizeWriteImpl<true>(const IR::Inst* value); template int RegAlloc::RealizeReadImpl<HostLoc::Kind::Flags>(const IR::Inst* value);
template int RegAlloc::RealizeWriteImpl<false>(const IR::Inst* value); template int RegAlloc::RealizeWriteImpl<HostLoc::Kind::Gpr>(const IR::Inst* value);
template int RegAlloc::RealizeWriteImpl<HostLoc::Kind::Fpr>(const IR::Inst* value);
template int RegAlloc::RealizeWriteImpl<HostLoc::Kind::Flags>(const IR::Inst* value);
void RegAlloc::Unlock(HostLoc host_loc) { void RegAlloc::Unlock(HostLoc host_loc) {
HostLocInfo& info = ValueInfo(host_loc); HostLocInfo& info = ValueInfo(host_loc);
@ -223,6 +239,17 @@ void RegAlloc::SpillFpr(int index) {
spills[new_location_index] = std::exchange(fprs[index], {}); spills[new_location_index] = std::exchange(fprs[index], {});
} }
void RegAlloc::SpillFlags() {
ASSERT(!flags.locked && !flags.realized);
if (flags.values.empty()) {
return;
}
const int new_location_index = AllocateRegister(gprs, gpr_order);
SpillGpr(new_location_index);
code.MRS(oaknut::XReg{new_location_index}, static_cast<oaknut::SystemReg>(0b11'011'0100'0010'000));
gprs[new_location_index] = std::exchange(flags, {});
}
int RegAlloc::FindFreeSpill() const { int RegAlloc::FindFreeSpill() const {
const auto iter = std::find_if(spills.begin(), spills.end(), [](const HostLocInfo& info) { return info.values.empty(); }); const auto iter = std::find_if(spills.begin(), spills.end(), [](const HostLocInfo& info) { return info.values.empty(); });
ASSERT_MSG(iter != spills.end(), "All spill locations are full"); ASSERT_MSG(iter != spills.end(), "All spill locations are full");
@ -240,6 +267,9 @@ std::optional<HostLoc> RegAlloc::ValueLocation(const IR::Inst* value) const {
if (const auto iter = std::find_if(fprs.begin(), fprs.end(), contains_value); iter != fprs.end()) { if (const auto iter = std::find_if(fprs.begin(), fprs.end(), contains_value); iter != fprs.end()) {
return HostLoc{HostLoc::Kind::Fpr, static_cast<int>(iter - fprs.begin())}; return HostLoc{HostLoc::Kind::Fpr, static_cast<int>(iter - fprs.begin())};
} }
if (contains_value(flags)) {
return HostLoc{HostLoc::Kind::Flags, 0};
}
if (const auto iter = std::find_if(spills.begin(), spills.end(), contains_value); iter != spills.end()) { if (const auto iter = std::find_if(spills.begin(), spills.end(), contains_value); iter != spills.end()) {
return HostLoc{HostLoc::Kind::Spill, static_cast<int>(iter - spills.begin())}; return HostLoc{HostLoc::Kind::Spill, static_cast<int>(iter - spills.begin())};
} }
@ -252,6 +282,8 @@ HostLocInfo& RegAlloc::ValueInfo(HostLoc host_loc) {
return gprs[static_cast<size_t>(host_loc.index)]; return gprs[static_cast<size_t>(host_loc.index)];
case HostLoc::Kind::Fpr: case HostLoc::Kind::Fpr:
return fprs[static_cast<size_t>(host_loc.index)]; return fprs[static_cast<size_t>(host_loc.index)];
case HostLoc::Kind::Flags:
return flags;
case HostLoc::Kind::Spill: case HostLoc::Kind::Spill:
return spills[static_cast<size_t>(host_loc.index)]; return spills[static_cast<size_t>(host_loc.index)];
} }
@ -263,13 +295,16 @@ HostLocInfo& RegAlloc::ValueInfo(const IR::Inst* value) {
return info.values.contains(value); return info.values.contains(value);
}; };
if (const auto iter = std::find_if(gprs.begin(), gprs.end(), contains_value)) { if (const auto iter = std::find_if(gprs.begin(), gprs.end(), contains_value); iter != gprs.end()) {
return *iter; return *iter;
} }
if (const auto iter = std::find_if(fprs.begin(), fprs.end(), contains_value)) { if (const auto iter = std::find_if(fprs.begin(), fprs.end(), contains_value); iter != gprs.end()) {
return *iter; return *iter;
} }
if (const auto iter = std::find_if(spills.begin(), spills.end(), contains_value)) { if (contains_value(flags)) {
return flags;
}
if (const auto iter = std::find_if(spills.begin(), spills.end(), contains_value); iter != gprs.end()) {
return *iter; return *iter;
} }
ASSERT_FALSE("RegAlloc::ValueInfo: Value not found"); ASSERT_FALSE("RegAlloc::ValueInfo: Value not found");

View file

@ -30,6 +30,7 @@ struct HostLoc {
enum class Kind { enum class Kind {
Gpr, Gpr,
Fpr, Fpr,
Flags,
Spill, Spill,
} kind; } kind;
int index; int index;
@ -60,10 +61,23 @@ private:
IR::Value value; IR::Value value;
}; };
struct FlagsTag {
private:
template<typename>
friend struct RAReg;
explicit FlagsTag(int) {}
int index() const { return 0; }
};
template<typename T> template<typename T>
struct RAReg { struct RAReg {
public: public:
static constexpr bool is_vector = std::is_base_of_v<oaknut::VReg, T>; static constexpr HostLoc::Kind kind = !std::is_same_v<FlagsTag, T>
? std::is_base_of_v<oaknut::VReg, T>
? HostLoc::Kind::Fpr
: HostLoc::Kind::Gpr
: HostLoc::Kind::Flags;
operator T() const { return *reg; } operator T() const { return *reg; }
@ -120,6 +134,8 @@ public:
auto ReadH(Argument& arg) { return RAReg<oaknut::HReg>{*this, false, PreReadImpl(arg.value)}; } auto ReadH(Argument& arg) { return RAReg<oaknut::HReg>{*this, false, PreReadImpl(arg.value)}; }
auto ReadB(Argument& arg) { return RAReg<oaknut::BReg>{*this, false, PreReadImpl(arg.value)}; } auto ReadB(Argument& arg) { return RAReg<oaknut::BReg>{*this, false, PreReadImpl(arg.value)}; }
auto ReadFlags(Argument& arg) { return RAReg<FlagsTag>{*this, false, PreReadImpl(arg.value)}; }
template<size_t size> template<size_t size>
auto ReadReg(Argument& arg) { auto ReadReg(Argument& arg) {
if constexpr (size == 64) { if constexpr (size == 64) {
@ -157,6 +173,8 @@ public:
auto WriteH(IR::Inst* inst) { return RAReg<oaknut::HReg>{*this, true, inst}; } auto WriteH(IR::Inst* inst) { return RAReg<oaknut::HReg>{*this, true, inst}; }
auto WriteB(IR::Inst* inst) { return RAReg<oaknut::BReg>{*this, true, inst}; } auto WriteB(IR::Inst* inst) { return RAReg<oaknut::BReg>{*this, true, inst}; }
auto WriteFlags(IR::Inst* inst) { return RAReg<FlagsTag>{*this, true, inst}; }
template<size_t size> template<size_t size>
auto WriteReg(IR::Inst* inst) { auto WriteReg(IR::Inst* inst) {
if constexpr (size == 64) { if constexpr (size == 64) {
@ -185,6 +203,7 @@ public:
} }
} }
void SpillFlags();
void SpillAll(); void SpillAll();
template<typename... Ts> template<typename... Ts>
@ -198,13 +217,14 @@ private:
friend struct RAReg; friend struct RAReg;
const IR::Inst* PreReadImpl(const IR::Value& value) { const IR::Inst* PreReadImpl(const IR::Value& value) {
ValueInfo(value.GetInst()).locked = true; const IR::Inst* inst = value.GetInst();
return value.GetInst(); ValueInfo(inst).locked = true;
return inst;
} }
template<bool is_vector> template<HostLoc::Kind kind>
int RealizeReadImpl(const IR::Inst* value); int RealizeReadImpl(const IR::Inst* value);
template<bool is_vector> template<HostLoc::Kind kind>
int RealizeWriteImpl(const IR::Inst* value); int RealizeWriteImpl(const IR::Inst* value);
void Unlock(HostLoc host_loc); void Unlock(HostLoc host_loc);
@ -223,6 +243,7 @@ private:
std::array<HostLocInfo, 32> gprs; std::array<HostLocInfo, 32> gprs;
std::array<HostLocInfo, 32> fprs; std::array<HostLocInfo, 32> fprs;
HostLocInfo flags;
std::array<HostLocInfo, SpillCount> spills; std::array<HostLocInfo, SpillCount> spills;
mutable std::mt19937 rand_gen; mutable std::mt19937 rand_gen;
@ -231,13 +252,13 @@ private:
template<typename T> template<typename T>
RAReg<T>::~RAReg() { RAReg<T>::~RAReg() {
if (reg) { if (reg) {
reg_alloc.Unlock(HostLoc{is_vector ? HostLoc::Kind::Fpr : HostLoc::Kind::Gpr, reg->index()}); reg_alloc.Unlock(HostLoc{kind, reg->index()});
} }
} }
template<typename T> template<typename T>
void RAReg<T>::Realize() { void RAReg<T>::Realize() {
reg = T{write ? reg_alloc.RealizeWriteImpl<is_vector>(value) : reg_alloc.RealizeReadImpl<is_vector>(value)}; reg = T{write ? reg_alloc.RealizeWriteImpl<kind>(value) : reg_alloc.RealizeReadImpl<kind>(value)};
} }
} // namespace Dynarmic::Backend::Arm64 } // namespace Dynarmic::Backend::Arm64