| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518 |
- using ARMeilleure.Decoders;
- using ARMeilleure.IntermediateRepresentation;
- using ARMeilleure.Translation;
- using System;
- using System.Diagnostics;
- using static ARMeilleure.Instructions.InstEmitHelper;
- using static ARMeilleure.Instructions.InstEmitSimdHelper;
- using static ARMeilleure.IntermediateRepresentation.Operand.Factory;
- namespace ARMeilleure.Instructions
- {
- static partial class InstEmit
- {
/// <summary>
/// Emits a bitwise AND of the Rn and Rm vectors and writes it to Rd.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void And_V(ArmEmitterContext context)
{
    if (!Optimizations.UseSse2)
    {
        // No SSE2: delegate to the shared binary-op helper.
        EmitVectorBinaryOpZx(context, (lhs, rhs) => context.BitwiseAnd(lhs, rhs));

        return;
    }

    OpCodeSimdReg op = (OpCodeSimdReg)context.CurrOp;

    Operand result = context.AddIntrinsic(Intrinsic.X86Pand, GetVec(op.Rn), GetVec(op.Rm));

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        result = context.VectorZeroUpper64(result);
    }

    context.Copy(GetVec(op.Rd), result);
}
/// <summary>
/// Emits Rn AND (NOT Rm) and writes it to Rd.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Bic_V(ArmEmitterContext context)
{
    if (!Optimizations.UseSse2)
    {
        // No SSE2: delegate to the shared binary-op helper.
        EmitVectorBinaryOpZx(context, (lhs, rhs) => context.BitwiseAnd(lhs, context.BitwiseNot(rhs)));

        return;
    }

    OpCodeSimdReg op = (OpCodeSimdReg)context.CurrOp;

    Operand source = GetVec(op.Rn);
    Operand clearBits = GetVec(op.Rm);

    // PANDN complements its first operand, so Rm is passed first.
    Operand result = context.AddIntrinsic(Intrinsic.X86Pandn, clearBits, source);

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        result = context.VectorZeroUpper64(result);
    }

    context.Copy(GetVec(op.Rd), result);
}
/// <summary>
/// Emits Rd AND (NOT immediate) and writes it back to Rd.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
/// <exception cref="InvalidOperationException">
/// Thrown on the SSE2 path when the element size is neither 16 nor 32 bits.
/// </exception>
public static void Bic_Vi(ArmEmitterContext context)
{
    if (!Optimizations.UseSse2)
    {
        // No SSE2: delegate to the shared immediate binary-op helper.
        EmitVectorImmBinaryOp(context, (lhs, rhs) => context.BitwiseAnd(lhs, context.BitwiseNot(rhs)));

        return;
    }

    OpCodeSimdImm op = (OpCodeSimdImm)context.CurrOp;

    int elementBits = 8 << op.Size;

    Operand target = GetVec(op.Rd);

    // The immediate is complemented up front so a plain PAND can be used below.
    Operand invertedImm;

    switch (elementBits)
    {
        case 16:
            invertedImm = X86GetAllElements(context, (short)~op.Immediate);
            break;

        case 32:
            invertedImm = X86GetAllElements(context, (int)~op.Immediate);
            break;

        default:
            throw new InvalidOperationException($"Invalid element size {elementBits}.");
    }

    Operand result = context.AddIntrinsic(Intrinsic.X86Pand, target, invertedImm);

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        result = context.VectorZeroUpper64(result);
    }

    context.Copy(GetVec(op.Rd), result);
}
/// <summary>
/// Emits the shared BIF/BIT sequence with <c>notRm</c> set, so the
/// complement of Rm is used as the selection mask.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Bif_V(ArmEmitterContext context) => EmitBifBit(context, notRm: true);
/// <summary>
/// Emits the shared BIF/BIT sequence with <c>notRm</c> cleared, so Rm
/// itself is used as the selection mask.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Bit_V(ArmEmitterContext context) => EmitBifBit(context, notRm: false);
/// <summary>
/// Emits <c>Rd = Rd ^ ((Rd ^ Rn) &amp; mask)</c>, where <c>mask</c> is Rm,
/// or the complement of Rm when <paramref name="notRm"/> is true.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
/// <param name="notRm">True to complement Rm before it is used as the mask.</param>
private static void EmitBifBit(ArmEmitterContext context, bool notRm)
{
    OpCodeSimdReg op = (OpCodeSimdReg)context.CurrOp;

    if (!Optimizations.UseSse2)
    {
        // Fallback: process the register in one or two pieces, each
        // extracted and re-inserted with size argument 3.
        int pieces = op.RegisterSize == RegisterSize.Simd128 ? 2 : 1;

        Operand assembled = context.VectorZero();

        for (int piece = 0; piece < pieces; piece++)
        {
            Operand dst = EmitVectorExtractZx(context, op.Rd, piece, 3);
            Operand src = EmitVectorExtractZx(context, op.Rn, piece, 3);
            Operand select = EmitVectorExtractZx(context, op.Rm, piece, 3);

            if (notRm)
            {
                select = context.BitwiseNot(select);
            }

            Operand differing = context.BitwiseExclusiveOr(dst, src);
            Operand picked = context.BitwiseAnd(differing, select);
            Operand merged = context.BitwiseExclusiveOr(picked, dst);

            assembled = EmitVectorInsert(context, assembled, merged, piece, 3);
        }

        context.Copy(GetVec(op.Rd), assembled);

        return;
    }

    Operand d = GetVec(op.Rd);
    Operand n = GetVec(op.Rn);
    Operand m = GetVec(op.Rm);

    // PANDN complements its first operand, which yields the (NOT Rm) mask.
    Intrinsic maskOp = notRm ? Intrinsic.X86Pandn : Intrinsic.X86Pand;

    Operand value = context.AddIntrinsic(Intrinsic.X86Pxor, n, d);
    value = context.AddIntrinsic(maskOp, m, value);
    value = context.AddIntrinsic(Intrinsic.X86Pxor, d, value);

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        value = context.VectorZeroUpper64(value);
    }

    context.Copy(d, value);
}
/// <summary>
/// Emits <c>Rd = Rm ^ ((Rn ^ Rm) &amp; Rd)</c>: the incoming value of Rd acts
/// as the mask that selects between Rn and Rm.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Bsl_V(ArmEmitterContext context)
{
    if (!Optimizations.UseSse2)
    {
        // No SSE2: same formula through the shared ternary-op helper.
        EmitVectorTernaryOpZx(context, (op1, op2, op3) =>
        {
            Operand differing = context.BitwiseExclusiveOr(op2, op3);
            Operand picked = context.BitwiseAnd(op1, differing);

            return context.BitwiseExclusiveOr(picked, op3);
        });

        return;
    }

    OpCodeSimdReg op = (OpCodeSimdReg)context.CurrOp;

    Operand selector = GetVec(op.Rd);
    Operand first = GetVec(op.Rn);
    Operand second = GetVec(op.Rm);

    Operand value = context.AddIntrinsic(Intrinsic.X86Pxor, first, second);
    value = context.AddIntrinsic(Intrinsic.X86Pand, value, selector);
    value = context.AddIntrinsic(Intrinsic.X86Pxor, value, second);

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        value = context.VectorZeroUpper64(value);
    }

    context.Copy(selector, value);
}
/// <summary>
/// Emits a bitwise exclusive OR of the Rn and Rm vectors and writes it to Rd.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Eor_V(ArmEmitterContext context)
{
    if (!Optimizations.UseSse2)
    {
        // No SSE2: delegate to the shared binary-op helper.
        EmitVectorBinaryOpZx(context, (lhs, rhs) => context.BitwiseExclusiveOr(lhs, rhs));

        return;
    }

    OpCodeSimdReg op = (OpCodeSimdReg)context.CurrOp;

    Operand result = context.AddIntrinsic(Intrinsic.X86Pxor, GetVec(op.Rn), GetVec(op.Rm));

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        result = context.VectorZeroUpper64(result);
    }

    context.Copy(GetVec(op.Rd), result);
}
/// <summary>
/// Emits the bitwise complement of the Rn vector and writes it to Rd.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Not_V(ArmEmitterContext context)
{
    if (!Optimizations.UseSse2)
    {
        // No SSE2: delegate to the shared unary-op helper.
        EmitVectorUnaryOpZx(context, (value) => context.BitwiseNot(value));

        return;
    }

    OpCodeSimd op = (OpCodeSimd)context.CurrOp;

    Operand source = GetVec(op.Rn);

    // PANDN complements its first operand; AND-ing with all ones leaves NOT Rn.
    Operand allOnes = X86GetAllElements(context, -1L);
    Operand result = context.AddIntrinsic(Intrinsic.X86Pandn, source, allOnes);

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        result = context.VectorZeroUpper64(result);
    }

    context.Copy(GetVec(op.Rd), result);
}
/// <summary>
/// Emits Rn OR (NOT Rm) and writes it to Rd.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Orn_V(ArmEmitterContext context)
{
    if (!Optimizations.UseSse2)
    {
        // No SSE2: delegate to the shared binary-op helper.
        EmitVectorBinaryOpZx(context, (lhs, rhs) => context.BitwiseOr(lhs, context.BitwiseNot(rhs)));

        return;
    }

    OpCodeSimdReg op = (OpCodeSimdReg)context.CurrOp;

    Operand first = GetVec(op.Rn);
    Operand second = GetVec(op.Rm);

    // PANDN against all ones produces NOT Rm, which is then OR-ed with Rn.
    Operand allOnes = X86GetAllElements(context, -1L);
    Operand invertedSecond = context.AddIntrinsic(Intrinsic.X86Pandn, second, allOnes);
    Operand result = context.AddIntrinsic(Intrinsic.X86Por, invertedSecond, first);

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        result = context.VectorZeroUpper64(result);
    }

    context.Copy(GetVec(op.Rd), result);
}
/// <summary>
/// Emits a bitwise OR of the Rn and Rm vectors and writes it to Rd.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Orr_V(ArmEmitterContext context)
{
    if (!Optimizations.UseSse2)
    {
        // No SSE2: delegate to the shared binary-op helper.
        EmitVectorBinaryOpZx(context, (lhs, rhs) => context.BitwiseOr(lhs, rhs));

        return;
    }

    OpCodeSimdReg op = (OpCodeSimdReg)context.CurrOp;

    Operand result = context.AddIntrinsic(Intrinsic.X86Por, GetVec(op.Rn), GetVec(op.Rm));

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        result = context.VectorZeroUpper64(result);
    }

    context.Copy(GetVec(op.Rd), result);
}
/// <summary>
/// Emits Rd OR immediate and writes it back to Rd.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
/// <exception cref="InvalidOperationException">
/// Thrown on the SSE2 path when the element size is neither 16 nor 32 bits.
/// </exception>
public static void Orr_Vi(ArmEmitterContext context)
{
    if (!Optimizations.UseSse2)
    {
        // No SSE2: delegate to the shared immediate binary-op helper.
        EmitVectorImmBinaryOp(context, (lhs, rhs) => context.BitwiseOr(lhs, rhs));

        return;
    }

    OpCodeSimdImm op = (OpCodeSimdImm)context.CurrOp;

    int elementBits = 8 << op.Size;

    Operand target = GetVec(op.Rd);

    // The immediate is placed in every element via X86GetAllElements.
    Operand splatImm;

    switch (elementBits)
    {
        case 16:
            splatImm = X86GetAllElements(context, (short)op.Immediate);
            break;

        case 32:
            splatImm = X86GetAllElements(context, (int)op.Immediate);
            break;

        default:
            throw new InvalidOperationException($"Invalid element size {elementBits}.");
    }

    Operand result = context.AddIntrinsic(Intrinsic.X86Por, target, splatImm);

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        result = context.VectorZeroUpper64(result);
    }

    context.Copy(GetVec(op.Rd), result);
}
/// <summary>
/// Emits a per-element bit reversal of Rn into Rd. Elements are extracted
/// and inserted with size argument 0 and reversed by
/// <c>EmitReverseBits8Op</c>; 16 elements are processed for Simd128,
/// otherwise 8.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Rbit_V(ArmEmitterContext context)
{
    OpCodeSimd op = (OpCodeSimd)context.CurrOp;

    int laneCount = op.RegisterSize == RegisterSize.Simd128 ? 16 : 8;

    Operand assembled = context.VectorZero();

    for (int lane = 0; lane < laneCount; lane++)
    {
        Operand original = EmitVectorExtractZx(context, op.Rn, lane, 0);
        Operand reversed = EmitReverseBits8Op(context, original);

        assembled = EmitVectorInsert(context, assembled, reversed, lane, 0);
    }

    context.Copy(GetVec(op.Rd), assembled);
}
/// <summary>
/// Emits the reversal of the low 8 bits of <paramref name="op"/> in three
/// swap stages: adjacent bits, then bit pairs, then nibbles.
/// </summary>
/// <param name="context">Emitter context used to emit the operations.</param>
/// <param name="op">I64 operand to reverse (asserted in debug builds).</param>
/// <returns>The operand produced by the final OR of the two nibble halves.</returns>
private static Operand EmitReverseBits8Op(ArmEmitterContext context, Operand op)
{
    Debug.Assert(op.Type == OperandType.I64);

    // Moves the bits under upperMask down and the bits under lowerMask up
    // by the same distance, then recombines them.
    Operand SwapGroups(Operand value, ulong upperMask, ulong lowerMask, int distance)
    {
        Operand movedDown = context.ShiftRightUI(context.BitwiseAnd(value, Const(upperMask)), Const(distance));
        Operand movedUp = context.ShiftLeft(context.BitwiseAnd(value, Const(lowerMask)), Const(distance));

        return context.BitwiseOr(movedDown, movedUp);
    }

    Operand swapped = SwapGroups(op, 0xaaul, 0x55ul, 1);
    swapped = SwapGroups(swapped, 0xccul, 0x33ul, 2);

    // Final stage: the upper nibble is shifted down unmasked, and only the
    // lower nibble is masked before it moves up.
    Operand upperNibble = context.ShiftRightUI(swapped, Const(4));
    Operand lowerNibble = context.ShiftLeft(context.BitwiseAnd(swapped, Const(0x0ful)), Const(4));

    return context.BitwiseOr(upperNibble, lowerNibble);
}
/// <summary>
/// Emits a swap of the two bytes inside every 16-bit container of Rn and
/// writes the result to Rd.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Rev16_V(ArmEmitterContext context)
{
    if (!Optimizations.UseSsse3)
    {
        // No SSSE3: use the generic element-reordering helper.
        EmitRev_V(context, containerSize: 1);

        return;
    }

    OpCodeSimd op = (OpCodeSimd)context.CurrOp;

    Operand source = GetVec(op.Rn);

    // PSHUFB control bytes: each byte is a source byte index, written here
    // from most to least significant. Neighbouring indices are exchanged.
    const long lowerIndices = 0x06_07_04_05_02_03_00_01L;
    const long upperIndices = 0x0E_0F_0C_0D_0A_0B_08_09L;

    Operand shuffle = X86GetScalar(context, lowerIndices);
    shuffle = EmitVectorInsert(context, shuffle, Const(upperIndices), 1, 3);

    Operand result = context.AddIntrinsic(Intrinsic.X86Pshufb, source, shuffle);

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        result = context.VectorZeroUpper64(result);
    }

    context.Copy(GetVec(op.Rd), result);
}
/// <summary>
/// Emits a reversal of the element order inside every 32-bit container of
/// Rn and writes the result to Rd. The shuffle mask depends on
/// <c>op.Size</c>.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Rev32_V(ArmEmitterContext context)
{
    if (!Optimizations.UseSsse3)
    {
        // No SSSE3: use the generic element-reordering helper.
        EmitRev_V(context, containerSize: 2);

        return;
    }

    OpCodeSimd op = (OpCodeSimd)context.CurrOp;

    Operand source = GetVec(op.Rn);

    // PSHUFB control bytes (source byte indices, most significant first)
    // for the lower and upper 64 bits of the mask.
    (long lowerIndices, long upperIndices) = op.Size switch
    {
        0 => (04L << 56 | 05L << 48 | 06L << 40 | 07L << 32 | 00L << 24 | 01L << 16 | 02L << 8 | 03L << 0,
              12L << 56 | 13L << 48 | 14L << 40 | 15L << 32 | 08L << 24 | 09L << 16 | 10L << 8 | 11L << 0),

        // Any other size takes the mask written for op.Size == 1.
        _ => (05L << 56 | 04L << 48 | 07L << 40 | 06L << 32 | 01L << 24 | 00L << 16 | 03L << 8 | 02L << 0,
              13L << 56 | 12L << 48 | 15L << 40 | 14L << 32 | 09L << 24 | 08L << 16 | 11L << 8 | 10L << 0),
    };

    Operand shuffle = X86GetScalar(context, lowerIndices);
    shuffle = EmitVectorInsert(context, shuffle, Const(upperIndices), 1, 3);

    Operand result = context.AddIntrinsic(Intrinsic.X86Pshufb, source, shuffle);

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        result = context.VectorZeroUpper64(result);
    }

    context.Copy(GetVec(op.Rd), result);
}
/// <summary>
/// Emits a reversal of the element order inside every 64-bit container of
/// Rn and writes the result to Rd. The shuffle mask depends on
/// <c>op.Size</c>.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
public static void Rev64_V(ArmEmitterContext context)
{
    if (!Optimizations.UseSsse3)
    {
        // No SSSE3: use the generic element-reordering helper.
        EmitRev_V(context, containerSize: 3);

        return;
    }

    OpCodeSimd op = (OpCodeSimd)context.CurrOp;

    Operand source = GetVec(op.Rn);

    // PSHUFB control bytes (source byte indices, most significant first)
    // for the lower and upper 64 bits of the mask.
    (long lowerIndices, long upperIndices) = op.Size switch
    {
        0 => (00L << 56 | 01L << 48 | 02L << 40 | 03L << 32 | 04L << 24 | 05L << 16 | 06L << 8 | 07L << 0,
              08L << 56 | 09L << 48 | 10L << 40 | 11L << 32 | 12L << 24 | 13L << 16 | 14L << 8 | 15L << 0),

        1 => (01L << 56 | 00L << 48 | 03L << 40 | 02L << 32 | 05L << 24 | 04L << 16 | 07L << 8 | 06L << 0,
              09L << 56 | 08L << 48 | 11L << 40 | 10L << 32 | 13L << 24 | 12L << 16 | 15L << 8 | 14L << 0),

        // Any other size takes the mask written for op.Size == 2.
        _ => (03L << 56 | 02L << 48 | 01L << 40 | 00L << 32 | 07L << 24 | 06L << 16 | 05L << 8 | 04L << 0,
              11L << 56 | 10L << 48 | 09L << 40 | 08L << 32 | 15L << 24 | 14L << 16 | 13L << 8 | 12L << 0),
    };

    Operand shuffle = X86GetScalar(context, lowerIndices);
    shuffle = EmitVectorInsert(context, shuffle, Const(upperIndices), 1, 3);

    Operand result = context.AddIntrinsic(Intrinsic.X86Pshufb, source, shuffle);

    // Simd64 results go through VectorZeroUpper64 before being stored.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        result = context.VectorZeroUpper64(result);
    }

    context.Copy(GetVec(op.Rd), result);
}
/// <summary>
/// Generic element-reversal emitter: copies each element of Rn to the
/// mirrored position inside its container and writes the result to Rd.
/// </summary>
/// <param name="context">Emitter context providing the current opcode.</param>
/// <param name="containerSize">
/// Container size on the same log2 scale as <c>op.Size</c>; callers in this
/// file pass 1, 2 or 3.
/// </param>
private static void EmitRev_V(ArmEmitterContext context, int containerSize)
{
    OpCodeSimd op = (OpCodeSimd)context.CurrOp;

    int elementSize = op.Size;
    int elementCount = op.GetBytesCount() >> elementSize;

    // XOR-ing an element index with this mask flips its position within
    // the container while leaving the container index unchanged.
    int flipMask = (1 << (containerSize - elementSize)) - 1;

    Operand assembled = context.VectorZero();

    for (int target = 0; target < elementCount; target++)
    {
        Operand moved = EmitVectorExtractZx(context, op.Rn, target ^ flipMask, elementSize);

        assembled = EmitVectorInsert(context, assembled, moved, target, elementSize);
    }

    context.Copy(GetVec(op.Rd), assembled);
}
- }
- }
|