IR: Implement VectorZeroExtend
This commit is contained in:
parent
d3a4e1efe2
commit
59ace60b03
4 changed files with 61 additions and 0 deletions
|
@ -634,6 +634,47 @@ void EmitX64::EmitVectorLogicalShiftLeft64(EmitContext& ctx, IR::Inst* inst) {
|
||||||
ctx.reg_alloc.DefineValue(inst, result);
|
ctx.reg_alloc.DefineValue(inst, result);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Shared emitter for the VectorZeroExtend{8,16,32,64} opcodes.
//
// `size` is the original element width in bits. The instruction's single
// argument is loaded into a scratch XMM register and its low elements are
// interleaved with a zeroed register using the punpckl* instruction that
// matches `size`, which widens each low element with zero bits.
// A `size` other than 8, 16, 32 or 64 emits no unpack instruction, and the
// argument is defined as the result unchanged.
static void EmitVectorZeroExtend(BlockOfCode& code, EmitContext& ctx, IR::Inst* inst, int size) {
    auto args = ctx.reg_alloc.GetArgumentInfo(inst);

    const Xbyak::Xmm value = ctx.reg_alloc.UseScratchXmm(args[0]);
    const Xbyak::Xmm zero = ctx.reg_alloc.ScratchXmm();

    // An all-zero register supplies the upper half of every widened element.
    code.pxor(zero, zero);

    if (size == 8) {
        code.punpcklbw(value, zero);
    } else if (size == 16) {
        code.punpcklwd(value, zero);
    } else if (size == 32) {
        code.punpckldq(value, zero);
    } else if (size == 64) {
        code.punpcklqdq(value, zero);
    }

    ctx.reg_alloc.DefineValue(inst, value);
}
|
||||||
|
|
||||||
|
// Emits VectorZeroExtend8 by forwarding to the shared helper with an
// original element width of 8 bits.
void EmitX64::EmitVectorZeroExtend8(EmitContext& ctx, IR::Inst* inst) {
    constexpr int original_esize = 8;
    EmitVectorZeroExtend(code, ctx, inst, original_esize);
}
|
||||||
|
|
||||||
|
// Emits VectorZeroExtend16 by forwarding to the shared helper with an
// original element width of 16 bits.
void EmitX64::EmitVectorZeroExtend16(EmitContext& ctx, IR::Inst* inst) {
    constexpr int original_esize = 16;
    EmitVectorZeroExtend(code, ctx, inst, original_esize);
}
|
||||||
|
|
||||||
|
// Emits VectorZeroExtend32 by forwarding to the shared helper with an
// original element width of 32 bits.
void EmitX64::EmitVectorZeroExtend32(EmitContext& ctx, IR::Inst* inst) {
    constexpr int original_esize = 32;
    EmitVectorZeroExtend(code, ctx, inst, original_esize);
}
|
||||||
|
|
||||||
|
// Emits VectorZeroExtend64 by forwarding to the shared helper with an
// original element width of 64 bits.
void EmitX64::EmitVectorZeroExtend64(EmitContext& ctx, IR::Inst* inst) {
    constexpr int original_esize = 64;
    EmitVectorZeroExtend(code, ctx, inst, original_esize);
}
|
||||||
|
|
||||||
void EmitX64::EmitVectorZeroUpper(EmitContext& ctx, IR::Inst* inst) {
|
void EmitX64::EmitVectorZeroUpper(EmitContext& ctx, IR::Inst* inst) {
|
||||||
auto args = ctx.reg_alloc.GetArgumentInfo(inst);
|
auto args = ctx.reg_alloc.GetArgumentInfo(inst);
|
||||||
|
|
||||||
|
|
|
@ -919,6 +919,21 @@ U128 IREmitter::VectorPairedAdd(size_t esize, const U128& a, const U128& b) {
|
||||||
return {};
|
return {};
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Builds the VectorZeroExtend IR instruction for the given original element
// size in bits, selecting the opcode variant whose suffix matches
// `original_esize` (8, 16, 32 or 64). Any other size reaches UNREACHABLE().
U128 IREmitter::VectorZeroExtend(size_t original_esize, const U128& a) {
    if (original_esize == 8) {
        return Inst<U128>(Opcode::VectorZeroExtend8, a);
    }
    if (original_esize == 16) {
        return Inst<U128>(Opcode::VectorZeroExtend16, a);
    }
    if (original_esize == 32) {
        return Inst<U128>(Opcode::VectorZeroExtend32, a);
    }
    if (original_esize == 64) {
        return Inst<U128>(Opcode::VectorZeroExtend64, a);
    }

    // No opcode variant exists for this element size.
    UNREACHABLE();
    return {};
}
|
||||||
|
|
||||||
// Builds a VectorZeroUpper IR instruction taking `a` as its only operand.
U128 IREmitter::VectorZeroUpper(const U128& a) {
    const U128 result = Inst<U128>(Opcode::VectorZeroUpper, a);
    return result;
}
|
||||||
|
|
|
@ -219,6 +219,7 @@ public:
|
||||||
U128 VectorOr(const U128& a, const U128& b);
|
U128 VectorOr(const U128& a, const U128& b);
|
||||||
U128 VectorPairedAdd(size_t esize, const U128& a, const U128& b);
|
U128 VectorPairedAdd(size_t esize, const U128& a, const U128& b);
|
||||||
U128 VectorPairedAddLower(size_t esize, const U128& a, const U128& b);
|
U128 VectorPairedAddLower(size_t esize, const U128& a, const U128& b);
|
||||||
|
U128 VectorZeroExtend(size_t original_esize, const U128& a);
|
||||||
U128 VectorZeroUpper(const U128& a);
|
U128 VectorZeroUpper(const U128& a);
|
||||||
|
|
||||||
U32U64 FPAbs(const U32U64& a);
|
U32U64 FPAbs(const U32U64& a);
|
||||||
|
|
|
@ -233,6 +233,10 @@ OPCODE(VectorPairedAdd8, T::U128, T::U128, T::U128
|
||||||
OPCODE(VectorPairedAdd16, T::U128, T::U128, T::U128 )
|
OPCODE(VectorPairedAdd16, T::U128, T::U128, T::U128 )
|
||||||
OPCODE(VectorPairedAdd32, T::U128, T::U128, T::U128 )
|
OPCODE(VectorPairedAdd32, T::U128, T::U128, T::U128 )
|
||||||
OPCODE(VectorPairedAdd64, T::U128, T::U128, T::U128 )
|
OPCODE(VectorPairedAdd64, T::U128, T::U128, T::U128 )
|
||||||
|
OPCODE(VectorZeroExtend8, T::U128, T::U128 )
|
||||||
|
OPCODE(VectorZeroExtend16, T::U128, T::U128 )
|
||||||
|
OPCODE(VectorZeroExtend32, T::U128, T::U128 )
|
||||||
|
OPCODE(VectorZeroExtend64, T::U128, T::U128 )
|
||||||
OPCODE(VectorZeroUpper, T::U128, T::U128 )
|
OPCODE(VectorZeroUpper, T::U128, T::U128 )
|
||||||
|
|
||||||
// Floating-point operations
|
// Floating-point operations
|
||||||
|
|
Loading…
Add table
Reference in a new issue