| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702
703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793 |
- using ChocolArm64.Decoders;
- using ChocolArm64.IntermediateRepresentation;
- using ChocolArm64.State;
- using ChocolArm64.Translation;
- using System;
- using System.Reflection.Emit;
- using System.Runtime.Intrinsics;
- using System.Runtime.Intrinsics.X86;
- using static ChocolArm64.Instructions.InstEmitSimdHelper;
- namespace ChocolArm64.Instructions
- {
- static partial class InstEmit
- {
#region "Masks"
// Every entry packs eight byte indices into one long, one index per byte.
// The emitters below select an entry with op.Size and hand pairs of entries to
// Sse2.SetVector128 to build the control vector consumed by Ssse3.Shuffle.

// Read by Xtn_V, EmitVectorTranspose and the 128-bit path of EmitVectorUnzip.
private static readonly long[] _masksE0_TrnUzpXtn =
{
    0x0E0C0A0806040200L, // bytes 14, 12, 10, 08, 06, 04, 02, 00
    0x0D0C090805040100L, // bytes 13, 12, 09, 08, 05, 04, 01, 00
    0x0B0A090803020100L  // bytes 11, 10, 09, 08, 03, 02, 01, 00
};

// Read by EmitVectorTranspose and the 128-bit path of EmitVectorUnzip.
private static readonly long[] _masksE1_TrnUzp =
{
    0x0F0D0B0907050301L, // bytes 15, 13, 11, 09, 07, 05, 03, 01
    0x0F0E0B0A07060302L, // bytes 15, 14, 11, 10, 07, 06, 03, 02
    0x0F0E0D0C07060504L  // bytes 15, 14, 13, 12, 07, 06, 05, 04
};

// Read by the 64-bit path of EmitVectorUnzip.
private static readonly long[] _masksE0_Uzp =
{
    0x0D0905010C080400L, // bytes 13, 09, 05, 01, 12, 08, 04, 00
    0x0B0A030209080100L  // bytes 11, 10, 03, 02, 09, 08, 01, 00
};

// Read by the 64-bit path of EmitVectorUnzip.
private static readonly long[] _masksE1_Uzp =
{
    0x0F0B07030E0A0602L, // bytes 15, 11, 07, 03, 14, 10, 06, 02
    0x0F0E07060D0C0504L  // bytes 15, 14, 07, 06, 13, 12, 05, 04
};
#endregion
// Emits code that loads integer register Rn and stores it into every element
// of vector Rd, using the element size given by op.Size.
public static void Dup_Gp(ILEmitterCtx context)
{
    OpCodeSimdIns64 op = (OpCodeSimdIns64)context.CurrOp;

    if (Optimizations.UseSse2)
    {
        Type[] broadcastArgs = { UIntTypesPerSizeLog2[op.Size] };

        context.EmitLdintzr(op.Rn);

        // Narrow the loaded value for sizes 0..2; any other size is passed through as loaded.
        if (op.Size == 0)
        {
            context.Emit(OpCodes.Conv_U1);
        }
        else if (op.Size == 1)
        {
            context.Emit(OpCodes.Conv_U2);
        }
        else if (op.Size == 2)
        {
            context.Emit(OpCodes.Conv_U4);
        }

        context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetAllVector128), broadcastArgs));

        context.EmitStvec(op.Rd);
    }
    else
    {
        // Fallback: insert the register value into each element, one at a time.
        int byteCount = op.GetBitsCount() >> 3;
        int elemCount = byteCount >> op.Size;

        for (int elem = 0; elem < elemCount; elem++)
        {
            context.EmitLdintzr(op.Rn);

            EmitVectorInsert(context, op.Rd, elem, op.Size);
        }
    }

    // 64-bit vector forms additionally run the zero-upper helper on Rd.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        EmitVectorZeroUpper(context, op.Rd);
    }
}
// Emits code that extracts the element of Rn at op.DstIndex (via the Zx
// extract helper) and writes it to Rd with the scalar-set helper.
public static void Dup_S(ILEmitterCtx context)
{
    OpCodeSimdIns64 ins = (OpCodeSimdIns64)context.CurrOp;

    int elemSize = ins.Size;

    EmitVectorExtractZx(context, ins.Rn, ins.DstIndex, elemSize);

    EmitScalarSet(context, ins.Rd, elemSize);
}
// Emits code that extracts the element of Rn at op.DstIndex and stores it into
// every element of vector Rd, using the element size given by op.Size.
public static void Dup_V(ILEmitterCtx context)
{
    OpCodeSimdIns64 op = (OpCodeSimdIns64)context.CurrOp;

    if (Optimizations.UseSse2)
    {
        Type[] broadcastArgs = { UIntTypesPerSizeLog2[op.Size] };

        EmitVectorExtractZx(context, op.Rn, op.DstIndex, op.Size);

        // Narrow the extracted value for sizes 0..2; any other size is passed through unchanged.
        if (op.Size == 0)
        {
            context.Emit(OpCodes.Conv_U1);
        }
        else if (op.Size == 1)
        {
            context.Emit(OpCodes.Conv_U2);
        }
        else if (op.Size == 2)
        {
            context.Emit(OpCodes.Conv_U4);
        }

        context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetAllVector128), broadcastArgs));

        context.EmitStvec(op.Rd);
    }
    else
    {
        // Fallback: re-extract the source element and insert it at each destination index.
        int byteCount = op.GetBitsCount() >> 3;
        int elemCount = byteCount >> op.Size;

        for (int elem = 0; elem < elemCount; elem++)
        {
            EmitVectorExtractZx(context, op.Rn, op.DstIndex, op.Size);

            EmitVectorInsert(context, op.Rd, elem, op.Size);
        }
    }

    // 64-bit vector forms additionally run the zero-upper helper on Rd.
    if (op.RegisterSize == RegisterSize.Simd64)
    {
        EmitVectorZeroUpper(context, op.Rd);
    }
}
// Emits code for the byte-wise extract of Rn and Rm starting at byte op.Imm4,
// writing the result to Rd.
public static void Ext_V(ILEmitterCtx context)
{
    OpCodeSimdExt64 op = (OpCodeSimdExt64)context.CurrOp;

    bool is64Bit = op.RegisterSize == RegisterSize.Simd64;

    if (Optimizations.UseSse2)
    {
        Type[] shiftArgs = { typeof(Vector128<byte>), typeof(byte) };
        Type[] orArgs    = { typeof(Vector128<byte>), typeof(Vector128<byte>) };

        // First operand: Rn shifted right by Imm4 bytes.
        context.EmitLdvec(op.Rn);

        if (is64Bit)
        {
            // Combine with a zero vector through MoveLowToHigh before shifting.
            VectorHelper.EmitCall(context, nameof(VectorHelper.VectorSingleZero));

            context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.MoveLowToHigh)));
        }

        context.EmitLdc_I4(op.Imm4);
        context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), shiftArgs));

        // Second operand: Rm shifted left by (vector width in bytes - Imm4).
        int widthInBytes = is64Bit ? 8 : 16;

        context.EmitLdvec(op.Rm);

        context.EmitLdc_I4(widthInBytes - op.Imm4);
        context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftLeftLogical128BitLane), shiftArgs));

        if (is64Bit)
        {
            VectorHelper.EmitCall(context, nameof(VectorHelper.VectorSingleZero));

            context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.MoveLowToHigh)));
        }

        context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Or), orArgs));

        context.EmitStvec(op.Rd);
    }
    else
    {
        int byteCount = op.GetBitsCount() >> 3;

        int srcByte = op.Imm4;

        for (int dstByte = 0; dstByte < byteCount; dstByte++)
        {
            // Bytes come from Rn until Imm4 + dstByte reaches the vector size, then from Rm.
            int srcReg;

            if (op.Imm4 + dstByte < byteCount)
            {
                srcReg = op.Rn;
            }
            else
            {
                srcReg = op.Rm;
            }

            // Restart the source position once it reaches the vector size.
            if (srcByte == byteCount)
            {
                srcByte = 0;
            }

            EmitVectorExtractZx(context, srcReg, srcByte, 0);
            EmitVectorInsertTmp(context, dstByte, 0);

            srcByte++;
        }

        context.EmitLdvectmp();
        context.EmitStvec(op.Rd);

        if (is64Bit)
        {
            EmitVectorZeroUpper(context, op.Rd);
        }
    }
}
// Emits a conditional select: when op.Cond holds, element 0 of Rn is used,
// otherwise element 0 of Rm; the chosen value is written to Rd as a scalar.
public static void Fcsel_S(ILEmitterCtx context)
{
    OpCodeSimdFcond64 op = (OpCodeSimdFcond64)context.CurrOp;

    ILLabel condHolds = new ILLabel();
    ILLabel merge     = new ILLabel();

    context.EmitCondBranch(condHolds, op.Cond);

    // Condition false: take Rm and skip over the Rn load.
    EmitVectorExtractF(context, op.Rm, 0, op.Size);

    context.Emit(OpCodes.Br_S, merge);

    // Condition true: take Rn.
    context.MarkLabel(condHolds);

    EmitVectorExtractF(context, op.Rn, 0, op.Size);

    context.MarkLabel(merge);

    EmitScalarSetF(context, op.Rd, op.Size);
}
// Emits code that extracts element 0 of vector Rn (element size op.Size + 2)
// and stores it to integer register Rd.
public static void Fmov_Ftoi(ILEmitterCtx context)
{
    OpCodeSimd64 simdOp = (OpCodeSimd64)context.CurrOp;

    int elemSize = simdOp.Size + 2;

    EmitVectorExtractZx(context, simdOp.Rn, 0, elemSize);

    context.EmitStintzr(simdOp.Rd);
}
// Emits code that extracts element 1 of vector Rn at size 3 and stores it to
// integer register Rd.
public static void Fmov_Ftoi1(ILEmitterCtx context)
{
    OpCodeSimd64 simdOp = (OpCodeSimd64)context.CurrOp;

    const int ElemIndex = 1;
    const int ElemSize  = 3;

    EmitVectorExtractZx(context, simdOp.Rn, ElemIndex, ElemSize);

    context.EmitStintzr(simdOp.Rd);
}
// Emits code that loads integer register Rn and writes it to vector Rd with
// the scalar-set helper (element size op.Size + 2).
public static void Fmov_Itof(ILEmitterCtx context)
{
    OpCodeSimd64 simdOp = (OpCodeSimd64)context.CurrOp;

    int elemSize = simdOp.Size + 2;

    context.EmitLdintzr(simdOp.Rn);

    EmitScalarSet(context, simdOp.Rd, elemSize);
}
// Emits code that loads integer register Rn and inserts it into element 1 of
// vector Rd at size 3.
public static void Fmov_Itof1(ILEmitterCtx context)
{
    OpCodeSimd64 simdOp = (OpCodeSimd64)context.CurrOp;

    const int ElemIndex = 1;
    const int ElemSize  = 3;

    context.EmitLdintzr(simdOp.Rn);

    EmitVectorInsert(context, simdOp.Rd, ElemIndex, ElemSize);
}
// Emits a scalar floating-point move: element 0 of Rn is extracted and written
// to Rd through the scalar-set helper.
public static void Fmov_S(ILEmitterCtx context)
{
    OpCodeSimd64 simdOp = (OpCodeSimd64)context.CurrOp;

    int fpSize = simdOp.Size;

    EmitVectorExtractF(context, simdOp.Rn, 0, fpSize);

    EmitScalarSetF(context, simdOp.Rd, fpSize);
}
// Emits code that loads the opcode's immediate as a 64-bit constant and writes
// it to Rd with the scalar-set helper (element size op.Size + 2).
public static void Fmov_Si(ILEmitterCtx context)
{
    OpCodeSimdFmov64 fmovOp = (OpCodeSimdFmov64)context.CurrOp;

    int elemSize = fmovOp.Size + 2;

    context.EmitLdc_I8(fmovOp.Imm);

    EmitScalarSet(context, fmovOp.Rd, elemSize);
}
// Emits code that inserts the opcode's immediate into each element of vector
// Rd (element size op.Size + 2).
public static void Fmov_Vi(ILEmitterCtx context)
{
    OpCodeSimdImm64 op = (OpCodeSimdImm64)context.CurrOp;

    // Base count is 4 for 128-bit vectors and 2 otherwise, then scaled down by op.Size.
    int baseCount = 2;

    if (op.RegisterSize == RegisterSize.Simd128)
    {
        baseCount = 4;
    }

    int elemCount = baseCount >> op.Size;

    for (int elem = 0; elem < elemCount; elem++)
    {
        context.EmitLdc_I8(op.Imm);

        EmitVectorInsert(context, op.Rd, elem, op.Size + 2);
    }

    if (op.RegisterSize == RegisterSize.Simd64)
    {
        EmitVectorZeroUpper(context, op.Rd);
    }
}
// Emits code that loads integer register Rn and inserts it into the element of
// vector Rd at op.DstIndex.
public static void Ins_Gp(ILEmitterCtx context)
{
    OpCodeSimdIns64 ins = (OpCodeSimdIns64)context.CurrOp;

    int dstElem  = ins.DstIndex;
    int elemSize = ins.Size;

    context.EmitLdintzr(ins.Rn);

    EmitVectorInsert(context, ins.Rd, dstElem, elemSize);
}
// Emits code that extracts the element of Rn at op.SrcIndex and inserts it
// into the element of Rd at op.DstIndex.
public static void Ins_V(ILEmitterCtx context)
{
    OpCodeSimdIns64 ins = (OpCodeSimdIns64)context.CurrOp;

    int elemSize = ins.Size;

    EmitVectorExtractZx(context, ins.Rn, ins.SrcIndex, elemSize);

    EmitVectorInsert(context, ins.Rd, ins.DstIndex, elemSize);
}
// Emits a vector move-immediate. Without SSE2 it falls back to the generic
// immediate unary-op helper with an empty operation.
public static void Movi_V(ILEmitterCtx context)
{
    if (!Optimizations.UseSse2)
    {
        EmitVectorImmUnaryOp(context, () => { });

        return;
    }

    EmitMoviMvni(context, not: false);
}
// Emits a vector move of the inverted immediate. Without SSE2 it falls back to
// the generic immediate unary-op helper with a bitwise NOT as the operation.
public static void Mvni_V(ILEmitterCtx context)
{
    if (!Optimizations.UseSse2)
    {
        EmitVectorImmUnaryOp(context, () => context.Emit(OpCodes.Not));

        return;
    }

    EmitMoviMvni(context, not: true);
}
// Emits code that extracts the element of Rn at op.DstIndex with the Sx
// extract helper and stores it to integer register Rd.
public static void Smov_S(ILEmitterCtx context)
{
    OpCodeSimdIns64 ins = (OpCodeSimdIns64)context.CurrOp;

    EmitVectorExtractSx(context, ins.Rn, ins.DstIndex, ins.Size);

    bool truncateTo32 = ins.RegisterSize == RegisterSize.Simd64;

    if (truncateTo32)
    {
        // Keep only the low 32 bits, then widen back to 64 bits unsigned.
        context.Emit(OpCodes.Conv_U4);
        context.Emit(OpCodes.Conv_U8);
    }

    context.EmitStintzr(ins.Rd);
}
// Emits a table lookup using op.Size consecutive table registers starting at
// Rn (register numbers wrap with & 0x1F) and the index vector Rm; the result
// goes to Rd.
public static void Tbl_V(ILEmitterCtx context)
{
    OpCodeSimdTbl64 op = (OpCodeSimdTbl64)context.CurrOp;

    if (Optimizations.UseSsse3)
    {
        Type[] sbytePair  = { typeof(Vector128<sbyte>), typeof(Vector128<sbyte>) };
        Type[] longPair   = { typeof(Vector128<long>),  typeof(Vector128<long>)  };
        Type[] longScalar = { typeof(long) };

        var setAll     = typeof(Sse2).GetMethod(nameof(Sse2.SetAllVector128), longScalar);
        var compareGt  = typeof(Sse2).GetMethod(nameof(Sse2.CompareGreaterThan), sbytePair);
        var subtract   = typeof(Sse2).GetMethod(nameof(Sse2.Subtract), sbytePair);
        var bitwiseOr  = typeof(Sse2).GetMethod(nameof(Sse2.Or), longPair);
        var shuffle    = typeof(Ssse3).GetMethod(nameof(Ssse3.Shuffle), sbytePair);

        // First table register: OR the (index > 0x0F) compare result into the
        // indices, then shuffle. The 0x0F vector is kept in tmp2 for reuse below.
        context.EmitLdvec(op.Rn);
        context.EmitLdvec(op.Rm);

        context.EmitLdc_I8(0x0F0F0F0F0F0F0F0FL);
        context.EmitCall(setAll);

        context.EmitStvectmp2();
        context.EmitLdvectmp2();

        context.EmitCall(compareGt);

        context.EmitLdvec(op.Rm);

        context.EmitCall(bitwiseOr);
        context.EmitCall(shuffle);

        // Remaining table registers: rebase the indices by 16 per table, repeat
        // the compare/OR/shuffle, and OR the partial result into the accumulator.
        for (int table = 1; table < op.Size; table++)
        {
            context.EmitLdvec((op.Rn + table) & 0x1F);
            context.EmitLdvec(op.Rm);

            context.EmitLdc_I8(0x1010101010101010L * table);
            context.EmitCall(setAll);

            context.EmitCall(subtract);

            context.EmitStvectmp();
            context.EmitLdvectmp();

            context.EmitLdvectmp2();

            context.EmitCall(compareGt);

            context.EmitLdvectmp();

            context.EmitCall(bitwiseOr);
            context.EmitCall(shuffle);

            context.EmitCall(bitwiseOr);
        }

        context.EmitStvec(op.Rd);

        if (op.RegisterSize == RegisterSize.Simd64)
        {
            EmitVectorZeroUpper(context, op.Rd);
        }
    }
    else
    {
        // Fallback: push the index vector followed by each table register and
        // call the managed helper that matches the table count.
        context.EmitLdvec(op.Rm);

        for (int table = 0; table < op.Size; table++)
        {
            context.EmitLdvec((op.Rn + table) & 0x1F);
        }

        string helper64;
        string helper128;

        switch (op.Size)
        {
            case 1:
                helper64  = nameof(VectorHelper.Tbl1_V64);
                helper128 = nameof(VectorHelper.Tbl1_V128);
                break;

            case 2:
                helper64  = nameof(VectorHelper.Tbl2_V64);
                helper128 = nameof(VectorHelper.Tbl2_V128);
                break;

            case 3:
                helper64  = nameof(VectorHelper.Tbl3_V64);
                helper128 = nameof(VectorHelper.Tbl3_V128);
                break;

            case 4:
                helper64  = nameof(VectorHelper.Tbl4_V64);
                helper128 = nameof(VectorHelper.Tbl4_V128);
                break;

            default:
                throw new InvalidOperationException();
        }

        VectorHelper.EmitCall(context, helper64, helper128);

        context.EmitStvec(op.Rd);
    }
}
// Transpose, part 0: delegates to EmitVectorTranspose.
public static void Trn1_V(ILEmitterCtx context) => EmitVectorTranspose(context, part: 0);
// Transpose, part 1: delegates to EmitVectorTranspose.
public static void Trn2_V(ILEmitterCtx context) => EmitVectorTranspose(context, part: 1);
// Emits code that extracts the element of Rn at op.DstIndex with the Zx
// extract helper and stores it to integer register Rd.
public static void Umov_S(ILEmitterCtx context)
{
    OpCodeSimdIns64 ins = (OpCodeSimdIns64)context.CurrOp;

    int srcElem  = ins.DstIndex;
    int elemSize = ins.Size;

    EmitVectorExtractZx(context, ins.Rn, srcElem, elemSize);

    context.EmitStintzr(ins.Rd);
}
// Unzip, part 0: delegates to EmitVectorUnzip.
public static void Uzp1_V(ILEmitterCtx context) => EmitVectorUnzip(context, part: 0);
// Unzip, part 1: delegates to EmitVectorUnzip.
public static void Uzp2_V(ILEmitterCtx context) => EmitVectorUnzip(context, part: 1);
// Emits a narrowing move: each element of Rn (size op.Size + 1) is written to
// Rd at size op.Size. For 128-bit opcodes the results are placed after the
// first (8 >> op.Size) elements of Rd, which are kept.
public static void Xtn_V(ILEmitterCtx context)
{
    OpCodeSimd64 op = (OpCodeSimd64)context.CurrOp;

    if (Optimizations.UseSsse3)
    {
        Type[] longPair = { typeof(long), typeof(long) };

        // Final combine step depends on the register size of the opcode.
        string combineName;

        if (op.RegisterSize == RegisterSize.Simd128)
        {
            combineName = nameof(Sse.MoveLowToHigh);
        }
        else
        {
            combineName = nameof(Sse.MoveHighToLow);
        }

        // Current Rd combined with a zero vector through MoveLowToHigh.
        context.EmitLdvec(op.Rd);
        VectorHelper.EmitCall(context, nameof(VectorHelper.VectorSingleZero));

        context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.MoveLowToHigh)));

        // Shuffle Rn with the same mask used for both halves of the control vector.
        context.EmitLdvec(op.Rn);

        long mask = _masksE0_TrnUzpXtn[op.Size];

        context.EmitLdc_I8(mask);
        context.Emit(OpCodes.Dup);

        context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetVector128), longPair));

        context.EmitCall(typeof(Ssse3).GetMethod(nameof(Ssse3.Shuffle), GetTypesSflUpk(0)));

        context.EmitCall(typeof(Sse).GetMethod(combineName));

        context.EmitStvec(op.Rd);
    }
    else
    {
        int elemCount = 8 >> op.Size;

        // Offset of the first destination element: elemCount for 128-bit opcodes, else 0.
        int dstBase = 0;

        if (op.RegisterSize == RegisterSize.Simd128)
        {
            dstBase = elemCount;
        }

        bool keepExisting = dstBase != 0;

        if (keepExisting)
        {
            // Seed the temporary with the current Rd so its other elements survive.
            context.EmitLdvec(op.Rd);
            context.EmitStvectmp();
        }

        for (int elem = 0; elem < elemCount; elem++)
        {
            EmitVectorExtractZx(context, op.Rn, elem, op.Size + 1);

            EmitVectorInsertTmp(context, dstBase + elem, op.Size);
        }

        context.EmitLdvectmp();
        context.EmitStvec(op.Rd);

        if (!keepExisting)
        {
            EmitVectorZeroUpper(context, op.Rd);
        }
    }
}
// Zip, part 0: delegates to EmitVectorZip.
public static void Zip1_V(ILEmitterCtx context) => EmitVectorZip(context, part: 0);
// Zip, part 1: delegates to EmitVectorZip.
public static void Zip2_V(ILEmitterCtx context) => EmitVectorZip(context, part: 1);
// SSE2 path shared by Movi_V and Mvni_V: broadcasts the opcode's immediate
// (bitwise-inverted when `not` is true) to all elements of Rd.
private static void EmitMoviMvni(ILEmitterCtx context, bool not)
{
    OpCodeSimdImm64 op = (OpCodeSimdImm64)context.CurrOp;

    Type[] broadcastArgs = { UIntTypesPerSizeLog2[op.Size] };

    long raw   = op.Imm;
    long value = not ? ~raw : raw;

    // Sizes below 3 load a 32-bit constant; size 3 and above load the full 64 bits.
    if (op.Size >= 3)
    {
        context.EmitLdc_I8(value);
    }
    else
    {
        context.EmitLdc_I4((int)value);
    }

    context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetAllVector128), broadcastArgs));

    context.EmitStvec(op.Rd);

    if (op.RegisterSize == RegisterSize.Simd64)
    {
        EmitVectorZeroUpper(context, op.Rd);
    }
}
// Shared emitter for Trn1_V (part 0) and Trn2_V (part 1): result elements
// alternate between Rn and Rm, taken from the source elements at
// (2 * i + part).
private static void EmitVectorTranspose(ILEmitterCtx context, int part)
{
    OpCodeSimdReg64 op = (OpCodeSimdReg64)context.CurrOp;

    if (Optimizations.UseSsse3)
    {
        Type[] longPair = { typeof(long), typeof(long) };

        string unpackName = nameof(Sse2.UnpackHigh);

        if (part == 0)
        {
            unpackName = nameof(Sse2.UnpackLow);
        }

        // Both operands get the same treatment, Rn first and then Rm: load,
        // and for sizes below 3 shuffle with the per-size mask pair.
        int[] operands = { op.Rn, op.Rm };

        foreach (int operand in operands)
        {
            context.EmitLdvec(operand); // value

            if (op.Size < 3)
            {
                context.EmitLdc_I8(_masksE1_TrnUzp   [op.Size]); // maskE1
                context.EmitLdc_I8(_masksE0_TrnUzpXtn[op.Size]); // maskE0

                context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetVector128), longPair));

                context.EmitCall(typeof(Ssse3).GetMethod(nameof(Ssse3.Shuffle), GetTypesSflUpk(0)));
            }
        }

        context.EmitCall(typeof(Sse2).GetMethod(unpackName, GetTypesSflUpk(op.Size)));

        context.EmitStvec(op.Rd);
    }
    else
    {
        int wordCount = op.GetBitsCount() >> 4;
        int pairCount = wordCount >> op.Size;

        // `even` walks the even destination indices 0, 2, 4, ...
        for (int even = 0; even < pairCount * 2; even += 2)
        {
            EmitVectorExtractZx(context, op.Rn, even + part, op.Size);
            EmitVectorExtractZx(context, op.Rm, even + part, op.Size);

            // Values are consumed in reverse push order: Rm's goes to the odd slot, Rn's to the even slot.
            EmitVectorInsertTmp(context, even + 1, op.Size);
            EmitVectorInsertTmp(context, even,     op.Size);
        }

        context.EmitLdvectmp();
        context.EmitStvec(op.Rd);
    }

    if (op.RegisterSize == RegisterSize.Simd64)
    {
        EmitVectorZeroUpper(context, op.Rd);
    }
}
// Shared emitter for Uzp1_V (part 0) and Uzp2_V (part 1): the source elements
// at (2 * i + part) of Rn fill the first half of the result and those of Rm
// fill the second half.
private static void EmitVectorUnzip(ILEmitterCtx context, int part)
{
    OpCodeSimdReg64 op = (OpCodeSimdReg64)context.CurrOp;

    if (Optimizations.UseSsse3)
    {
        Type[] longPair = { typeof(long), typeof(long) };

        string unpackName = nameof(Sse2.UnpackHigh);

        if (part == 0)
        {
            unpackName = nameof(Sse2.UnpackLow);
        }

        if (op.RegisterSize != RegisterSize.Simd128)
        {
            // 64-bit form: interleave Rn and Rm first, shuffle the combined
            // vector for sizes below 2, then unpack against a zero vector.
            context.EmitLdvec(op.Rn);
            context.EmitLdvec(op.Rm);

            context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.UnpackLow), GetTypesSflUpk(op.Size))); // value

            if (op.Size < 2)
            {
                context.EmitLdc_I8(_masksE1_Uzp[op.Size]); // maskE1
                context.EmitLdc_I8(_masksE0_Uzp[op.Size]); // maskE0

                context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetVector128), longPair));

                context.EmitCall(typeof(Ssse3).GetMethod(nameof(Ssse3.Shuffle), GetTypesSflUpk(0)));
            }

            VectorHelper.EmitCall(context, nameof(VectorHelper.VectorSingleZero));

            context.EmitCall(typeof(Sse2).GetMethod(unpackName, GetTypesSflUpk(3)));

            context.EmitStvec(op.Rd);
        }
        else
        {
            // 128-bit form: Rn and then Rm are each loaded and, for sizes
            // below 3, shuffled with the per-size mask pair before the unpack.
            int[] operands = { op.Rn, op.Rm };

            foreach (int operand in operands)
            {
                context.EmitLdvec(operand); // value

                if (op.Size < 3)
                {
                    context.EmitLdc_I8(_masksE1_TrnUzp   [op.Size]); // maskE1
                    context.EmitLdc_I8(_masksE0_TrnUzpXtn[op.Size]); // maskE0

                    context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetVector128), longPair));

                    context.EmitCall(typeof(Ssse3).GetMethod(nameof(Ssse3.Shuffle), GetTypesSflUpk(0)));
                }
            }

            context.EmitCall(typeof(Sse2).GetMethod(unpackName, GetTypesSflUpk(3)));

            context.EmitStvec(op.Rd);
        }
    }
    else
    {
        int wordCount = op.GetBitsCount() >> 4;
        int pairCount = wordCount >> op.Size;

        for (int pair = 0; pair < pairCount; pair++)
        {
            int srcElem = (pair << 1) + part;

            EmitVectorExtractZx(context, op.Rn, srcElem, op.Size);
            EmitVectorExtractZx(context, op.Rm, srcElem, op.Size);

            // Values are consumed in reverse push order: Rm's lands in the second half, Rn's in the first.
            EmitVectorInsertTmp(context, pairCount + pair, op.Size);
            EmitVectorInsertTmp(context, pair,             op.Size);
        }

        context.EmitLdvectmp();
        context.EmitStvec(op.Rd);

        if (op.RegisterSize == RegisterSize.Simd64)
        {
            EmitVectorZeroUpper(context, op.Rd);
        }
    }
}
// Shared emitter for Zip1_V (part 0) and Zip2_V (part 1): interleaves elements
// of Rn and Rm, reading from the first half of the sources for part 0 and from
// the second half otherwise.
private static void EmitVectorZip(ILEmitterCtx context, int part)
{
    OpCodeSimdReg64 op = (OpCodeSimdReg64)context.CurrOp;

    if (Optimizations.UseSse2)
    {
        string unpackName = nameof(Sse2.UnpackHigh);

        if (part == 0)
        {
            unpackName = nameof(Sse2.UnpackLow);
        }

        context.EmitLdvec(op.Rn);
        context.EmitLdvec(op.Rm);

        if (op.RegisterSize != RegisterSize.Simd128)
        {
            // 64-bit form: interleave the low halves, then pick the requested
            // 64-bit half by unpacking against a zero vector.
            context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.UnpackLow), GetTypesSflUpk(op.Size)));

            VectorHelper.EmitCall(context, nameof(VectorHelper.VectorSingleZero));

            context.EmitCall(typeof(Sse2).GetMethod(unpackName, GetTypesSflUpk(3)));
        }
        else
        {
            context.EmitCall(typeof(Sse2).GetMethod(unpackName, GetTypesSflUpk(op.Size)));
        }

        context.EmitStvec(op.Rd);
    }
    else
    {
        int wordCount = op.GetBitsCount() >> 4;
        int pairCount = wordCount >> op.Size;

        // Source elements start at 0 for part 0 and at pairCount otherwise.
        int srcBase = 0;

        if (part != 0)
        {
            srcBase = pairCount;
        }

        for (int pair = 0; pair < pairCount; pair++)
        {
            int dstElem = pair << 1;

            EmitVectorExtractZx(context, op.Rn, srcBase + pair, op.Size);
            EmitVectorExtractZx(context, op.Rm, srcBase + pair, op.Size);

            // Values are consumed in reverse push order: Rm's goes to the odd slot, Rn's to the even slot.
            EmitVectorInsertTmp(context, dstElem + 1, op.Size);
            EmitVectorInsertTmp(context, dstElem,     op.Size);
        }

        context.EmitLdvectmp();
        context.EmitStvec(op.Rd);

        if (op.RegisterSize == RegisterSize.Simd64)
        {
            EmitVectorZeroUpper(context, op.Rd);
        }
    }
}
// Builds the two-parameter type list used to look up the Shuffle/Unpack
// overloads: the VectorIntTypesPerSizeLog2 entry for `size`, listed twice.
private static Type[] GetTypesSflUpk(int size)
{
    Type[] signature = new Type[2];

    signature[0] = VectorIntTypesPerSizeLog2[size];
    signature[1] = VectorIntTypesPerSizeLog2[size];

    return signature;
}
- }
- }
|