From e41640fe332a64ec2be3aab47680a379320f968c Mon Sep 17 00:00:00 2001 From: Lioncash Date: Mon, 23 Apr 2018 11:16:25 -0400 Subject: [PATCH] A64: Implement RADDHN/RADDHN2 --- src/frontend/A64/decoder/a64.inc | 2 +- .../A64/translate/impl/simd_three_same.cpp | 38 +++++++++++++++---- 2 files changed, 31 insertions(+), 9 deletions(-) diff --git a/src/frontend/A64/decoder/a64.inc b/src/frontend/A64/decoder/a64.inc index e25b9f32..4eaef82a 100644 --- a/src/frontend/A64/decoder/a64.inc +++ b/src/frontend/A64/decoder/a64.inc @@ -691,7 +691,7 @@ INST(UADDL, "UADDL, UADDL2", "0Q101 INST(UADDW, "UADDW, UADDW2", "0Q101110zz1mmmmm000100nnnnnddddd") INST(USUBL, "USUBL, USUBL2", "0Q101110zz1mmmmm001000nnnnnddddd") INST(USUBW, "USUBW, USUBW2", "0Q101110zz1mmmmm001100nnnnnddddd") -//INST(RADDHN, "RADDHN, RADDHN2", "0Q101110zz1mmmmm010000nnnnnddddd") +INST(RADDHN, "RADDHN, RADDHN2", "0Q101110zz1mmmmm010000nnnnnddddd") //INST(UABAL, "UABAL, UABAL2", "0Q101110zz1mmmmm010100nnnnnddddd") //INST(RSUBHN, "RSUBHN, RSUBHN2", "0Q101110zz1mmmmm011000nnnnnddddd") //INST(UABDL, "UABDL, UABDL2", "0Q101110zz1mmmmm011100nnnnnddddd") diff --git a/src/frontend/A64/translate/impl/simd_three_same.cpp b/src/frontend/A64/translate/impl/simd_three_same.cpp index 1501d694..670d99bc 100644 --- a/src/frontend/A64/translate/impl/simd_three_same.cpp +++ b/src/frontend/A64/translate/impl/simd_three_same.cpp @@ -13,21 +13,34 @@ enum class HighNarrowingOp { Subtract, }; +enum class ExtraBehavior { + None, + Round +}; + static void HighNarrowingOperation(TranslatorVisitor& v, bool Q, Imm<2> size, Vec Vm, Vec Vn, Vec Vd, - HighNarrowingOp op) { + HighNarrowingOp op, ExtraBehavior behavior) { const size_t part = Q; const size_t esize = 8 << size.ZeroExtend(); + const size_t doubled_esize = 2 * esize; const IR::U128 operand1 = v.ir.GetQ(Vn); const IR::U128 operand2 = v.ir.GetQ(Vm); - const IR::U128 wide = [&] { + IR::U128 wide = [&] { if (op == HighNarrowingOp::Add) { - return v.ir.VectorAdd(2 * esize, operand1, 
operand2); + return v.ir.VectorAdd(doubled_esize, operand1, operand2); } - return v.ir.VectorSub(2 * esize, operand1, operand2); + return v.ir.VectorSub(doubled_esize, operand1, operand2); }(); - const IR::U128 result = v.ir.VectorNarrow(2 * esize, - v.ir.VectorLogicalShiftRight(2 * esize, wide, static_cast<u8>(esize))); + + if (behavior == ExtraBehavior::Round) { + const u64 round_const = 1ULL << (esize - 1); + const IR::U128 round_operand = v.ir.VectorBroadcast(doubled_esize, v.I(doubled_esize, round_const)); + wide = v.ir.VectorAdd(doubled_esize, wide, round_operand); + } + + const IR::U128 result = v.ir.VectorNarrow(doubled_esize, + v.ir.VectorLogicalShiftRight(doubled_esize, wide, static_cast<u8>(esize))); v.Vpart(64, Vd, part, result); } @@ -139,7 +152,16 @@ bool TranslatorVisitor::ADDHN(bool Q, Imm<2> size, Vec Vm, Vec Vn, Vec Vd) { return ReservedValue(); } - HighNarrowingOperation(*this, Q, size, Vm, Vn, Vd, HighNarrowingOp::Add); + HighNarrowingOperation(*this, Q, size, Vm, Vn, Vd, HighNarrowingOp::Add, ExtraBehavior::None); + return true; +} + +bool TranslatorVisitor::RADDHN(bool Q, Imm<2> size, Vec Vm, Vec Vn, Vec Vd) { + if (size == 0b11) { + return ReservedValue(); + } + + HighNarrowingOperation(*this, Q, size, Vm, Vn, Vd, HighNarrowingOp::Add, ExtraBehavior::Round); return true; } @@ -148,7 +170,7 @@ bool TranslatorVisitor::SUBHN(bool Q, Imm<2> size, Vec Vm, Vec Vn, Vec Vd) { return ReservedValue(); } - HighNarrowingOperation(*this, Q, size, Vm, Vn, Vd, HighNarrowingOp::Subtract); + HighNarrowingOperation(*this, Q, size, Vm, Vn, Vd, HighNarrowingOp::Subtract, ExtraBehavior::None); return true; }