InstEmitSimdLogical.cs 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437
  1. using ChocolArm64.Decoders;
  2. using ChocolArm64.State;
  3. using ChocolArm64.Translation;
  4. using System;
  5. using System.Reflection.Emit;
  6. using System.Runtime.Intrinsics;
  7. using System.Runtime.Intrinsics.X86;
  8. using static ChocolArm64.Instructions.InstEmitSimdHelper;
  9. namespace ChocolArm64.Instructions
  10. {
  11. static partial class InstEmit
  12. {
  13. public static void And_V(ILEmitterCtx context)
  14. {
  15. if (Optimizations.UseSse2)
  16. {
  17. EmitSse2Op(context, nameof(Sse2.And));
  18. }
  19. else
  20. {
  21. EmitVectorBinaryOpZx(context, () => context.Emit(OpCodes.And));
  22. }
  23. }
  24. public static void Bic_V(ILEmitterCtx context)
  25. {
  26. if (Optimizations.UseSse2)
  27. {
  28. OpCodeSimdReg64 op = (OpCodeSimdReg64)context.CurrOp;
  29. Type[] typesAnt = new Type[] { typeof(Vector128<byte>), typeof(Vector128<byte>) };
  30. context.EmitLdvec(op.Rm);
  31. context.EmitLdvec(op.Rn);
  32. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.AndNot), typesAnt));
  33. context.EmitStvec(op.Rd);
  34. if (op.RegisterSize == RegisterSize.Simd64)
  35. {
  36. EmitVectorZeroUpper(context, op.Rd);
  37. }
  38. }
  39. else
  40. {
  41. EmitVectorBinaryOpZx(context, () =>
  42. {
  43. context.Emit(OpCodes.Not);
  44. context.Emit(OpCodes.And);
  45. });
  46. }
  47. }
  48. public static void Bic_Vi(ILEmitterCtx context)
  49. {
  50. EmitVectorImmBinaryOp(context, () =>
  51. {
  52. context.Emit(OpCodes.Not);
  53. context.Emit(OpCodes.And);
  54. });
  55. }
  56. public static void Bif_V(ILEmitterCtx context)
  57. {
  58. EmitBifBit(context, notRm: true);
  59. }
  60. public static void Bit_V(ILEmitterCtx context)
  61. {
  62. EmitBifBit(context, notRm: false);
  63. }
  64. private static void EmitBifBit(ILEmitterCtx context, bool notRm)
  65. {
  66. OpCodeSimdReg64 op = (OpCodeSimdReg64)context.CurrOp;
  67. if (Optimizations.UseSse2)
  68. {
  69. Type[] typesXorAnd = new Type[] { typeof(Vector128<byte>), typeof(Vector128<byte>) };
  70. string nameAnd = notRm ? nameof(Sse2.AndNot) : nameof(Sse2.And);
  71. context.EmitLdvec(op.Rd);
  72. context.EmitLdvec(op.Rm);
  73. context.EmitLdvec(op.Rn);
  74. context.EmitLdvec(op.Rd);
  75. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Xor), typesXorAnd));
  76. context.EmitCall(typeof(Sse2).GetMethod(nameAnd, typesXorAnd));
  77. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Xor), typesXorAnd));
  78. context.EmitStvec(op.Rd);
  79. if (op.RegisterSize == RegisterSize.Simd64)
  80. {
  81. EmitVectorZeroUpper(context, op.Rd);
  82. }
  83. }
  84. else
  85. {
  86. int elems = op.RegisterSize == RegisterSize.Simd128 ? 2 : 1;
  87. for (int index = 0; index < elems; index++)
  88. {
  89. EmitVectorExtractZx(context, op.Rd, index, 3);
  90. context.Emit(OpCodes.Dup);
  91. EmitVectorExtractZx(context, op.Rn, index, 3);
  92. context.Emit(OpCodes.Xor);
  93. EmitVectorExtractZx(context, op.Rm, index, 3);
  94. if (notRm)
  95. {
  96. context.Emit(OpCodes.Not);
  97. }
  98. context.Emit(OpCodes.And);
  99. context.Emit(OpCodes.Xor);
  100. EmitVectorInsert(context, op.Rd, index, 3);
  101. }
  102. if (op.RegisterSize == RegisterSize.Simd64)
  103. {
  104. EmitVectorZeroUpper(context, op.Rd);
  105. }
  106. }
  107. }
  108. public static void Bsl_V(ILEmitterCtx context)
  109. {
  110. if (Optimizations.UseSse2)
  111. {
  112. OpCodeSimdReg64 op = (OpCodeSimdReg64)context.CurrOp;
  113. Type[] typesXorAnd = new Type[] { typeof(Vector128<byte>), typeof(Vector128<byte>) };
  114. context.EmitLdvec(op.Rm);
  115. context.EmitLdvec(op.Rm);
  116. context.EmitLdvec(op.Rn);
  117. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Xor), typesXorAnd));
  118. context.EmitLdvec(op.Rd);
  119. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.And), typesXorAnd));
  120. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Xor), typesXorAnd));
  121. context.EmitStvec(op.Rd);
  122. if (op.RegisterSize == RegisterSize.Simd64)
  123. {
  124. EmitVectorZeroUpper(context, op.Rd);
  125. }
  126. }
  127. else
  128. {
  129. EmitVectorTernaryOpZx(context, () =>
  130. {
  131. context.EmitSttmp();
  132. context.EmitLdtmp();
  133. context.Emit(OpCodes.Xor);
  134. context.Emit(OpCodes.And);
  135. context.EmitLdtmp();
  136. context.Emit(OpCodes.Xor);
  137. });
  138. }
  139. }
  140. public static void Eor_V(ILEmitterCtx context)
  141. {
  142. if (Optimizations.UseSse2)
  143. {
  144. EmitSse2Op(context, nameof(Sse2.Xor));
  145. }
  146. else
  147. {
  148. EmitVectorBinaryOpZx(context, () => context.Emit(OpCodes.Xor));
  149. }
  150. }
  151. public static void Not_V(ILEmitterCtx context)
  152. {
  153. if (Optimizations.UseSse2)
  154. {
  155. OpCodeSimd64 op = (OpCodeSimd64)context.CurrOp;
  156. Type[] typesSav = new Type[] { typeof(long) };
  157. Type[] typesAnt = new Type[] { typeof(Vector128<long>), typeof(Vector128<long>) };
  158. context.EmitLdvec(op.Rn);
  159. context.EmitLdc_I8(-1L);
  160. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetAllVector128), typesSav));
  161. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.AndNot), typesAnt));
  162. context.EmitStvec(op.Rd);
  163. if (op.RegisterSize == RegisterSize.Simd64)
  164. {
  165. EmitVectorZeroUpper(context, op.Rd);
  166. }
  167. }
  168. else
  169. {
  170. EmitVectorUnaryOpZx(context, () => context.Emit(OpCodes.Not));
  171. }
  172. }
  173. public static void Orn_V(ILEmitterCtx context)
  174. {
  175. if (Optimizations.UseSse2)
  176. {
  177. OpCodeSimdReg64 op = (OpCodeSimdReg64)context.CurrOp;
  178. Type[] typesSav = new Type[] { typeof(long) };
  179. Type[] typesAntOr = new Type[] { typeof(Vector128<long>), typeof(Vector128<long>) };
  180. context.EmitLdvec(op.Rn);
  181. context.EmitLdvec(op.Rm);
  182. context.EmitLdc_I8(-1L);
  183. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetAllVector128), typesSav));
  184. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.AndNot), typesAntOr));
  185. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Or), typesAntOr));
  186. context.EmitStvec(op.Rd);
  187. if (op.RegisterSize == RegisterSize.Simd64)
  188. {
  189. EmitVectorZeroUpper(context, op.Rd);
  190. }
  191. }
  192. else
  193. {
  194. EmitVectorBinaryOpZx(context, () =>
  195. {
  196. context.Emit(OpCodes.Not);
  197. context.Emit(OpCodes.Or);
  198. });
  199. }
  200. }
  201. public static void Orr_V(ILEmitterCtx context)
  202. {
  203. if (Optimizations.UseSse2)
  204. {
  205. EmitSse2Op(context, nameof(Sse2.Or));
  206. }
  207. else
  208. {
  209. EmitVectorBinaryOpZx(context, () => context.Emit(OpCodes.Or));
  210. }
  211. }
  212. public static void Orr_Vi(ILEmitterCtx context)
  213. {
  214. EmitVectorImmBinaryOp(context, () => context.Emit(OpCodes.Or));
  215. }
  216. public static void Rbit_V(ILEmitterCtx context)
  217. {
  218. OpCodeSimd64 op = (OpCodeSimd64)context.CurrOp;
  219. int elems = op.RegisterSize == RegisterSize.Simd128 ? 16 : 8;
  220. for (int index = 0; index < elems; index++)
  221. {
  222. EmitVectorExtractZx(context, op.Rn, index, 0);
  223. context.Emit(OpCodes.Conv_U4);
  224. SoftFallback.EmitCall(context, nameof(SoftFallback.ReverseBits8));
  225. context.Emit(OpCodes.Conv_U8);
  226. EmitVectorInsert(context, op.Rd, index, 0);
  227. }
  228. if (op.RegisterSize == RegisterSize.Simd64)
  229. {
  230. EmitVectorZeroUpper(context, op.Rd);
  231. }
  232. }
  233. public static void Rev16_V(ILEmitterCtx context)
  234. {
  235. if (Optimizations.UseSsse3)
  236. {
  237. OpCodeSimd64 op = (OpCodeSimd64)context.CurrOp;
  238. Type[] typesSve = new Type[] { typeof(long), typeof(long) };
  239. Type[] typesSfl = new Type[] { typeof(Vector128<sbyte>), typeof(Vector128<sbyte>) };
  240. context.EmitLdvec(op.Rn); // value
  241. context.EmitLdc_I8(14L << 56 | 15L << 48 | 12L << 40 | 13L << 32 | 10L << 24 | 11L << 16 | 08L << 8 | 09L << 0); // maskE1
  242. context.EmitLdc_I8(06L << 56 | 07L << 48 | 04L << 40 | 05L << 32 | 02L << 24 | 03L << 16 | 00L << 8 | 01L << 0); // maskE0
  243. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetVector128), typesSve));
  244. context.EmitCall(typeof(Ssse3).GetMethod(nameof(Ssse3.Shuffle), typesSfl));
  245. context.EmitStvec(op.Rd);
  246. if (op.RegisterSize == RegisterSize.Simd64)
  247. {
  248. EmitVectorZeroUpper(context, op.Rd);
  249. }
  250. }
  251. else
  252. {
  253. EmitRev_V(context, containerSize: 1);
  254. }
  255. }
  256. public static void Rev32_V(ILEmitterCtx context)
  257. {
  258. if (Optimizations.UseSsse3)
  259. {
  260. OpCodeSimd64 op = (OpCodeSimd64)context.CurrOp;
  261. Type[] typesSve = new Type[] { typeof(long), typeof(long) };
  262. Type[] typesSfl = new Type[] { typeof(Vector128<sbyte>), typeof(Vector128<sbyte>) };
  263. context.EmitLdvec(op.Rn); // value
  264. if (op.Size == 0)
  265. {
  266. context.EmitLdc_I8(12L << 56 | 13L << 48 | 14L << 40 | 15L << 32 | 08L << 24 | 09L << 16 | 10L << 8 | 11L << 0); // maskE1
  267. context.EmitLdc_I8(04L << 56 | 05L << 48 | 06L << 40 | 07L << 32 | 00L << 24 | 01L << 16 | 02L << 8 | 03L << 0); // maskE0
  268. }
  269. else /* if (op.Size == 1) */
  270. {
  271. context.EmitLdc_I8(13L << 56 | 12L << 48 | 15L << 40 | 14L << 32 | 09L << 24 | 08L << 16 | 11L << 8 | 10L << 0); // maskE1
  272. context.EmitLdc_I8(05L << 56 | 04L << 48 | 07L << 40 | 06L << 32 | 01L << 24 | 00L << 16 | 03L << 8 | 02L << 0); // maskE0
  273. }
  274. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetVector128), typesSve));
  275. context.EmitCall(typeof(Ssse3).GetMethod(nameof(Ssse3.Shuffle), typesSfl));
  276. context.EmitStvec(op.Rd);
  277. if (op.RegisterSize == RegisterSize.Simd64)
  278. {
  279. EmitVectorZeroUpper(context, op.Rd);
  280. }
  281. }
  282. else
  283. {
  284. EmitRev_V(context, containerSize: 2);
  285. }
  286. }
  287. public static void Rev64_V(ILEmitterCtx context)
  288. {
  289. if (Optimizations.UseSsse3)
  290. {
  291. OpCodeSimd64 op = (OpCodeSimd64)context.CurrOp;
  292. Type[] typesSve = new Type[] { typeof(long), typeof(long) };
  293. Type[] typesSfl = new Type[] { typeof(Vector128<sbyte>), typeof(Vector128<sbyte>) };
  294. context.EmitLdvec(op.Rn); // value
  295. if (op.Size == 0)
  296. {
  297. context.EmitLdc_I8(08L << 56 | 09L << 48 | 10L << 40 | 11L << 32 | 12L << 24 | 13L << 16 | 14L << 8 | 15L << 0); // maskE1
  298. context.EmitLdc_I8(00L << 56 | 01L << 48 | 02L << 40 | 03L << 32 | 04L << 24 | 05L << 16 | 06L << 8 | 07L << 0); // maskE0
  299. }
  300. else if (op.Size == 1)
  301. {
  302. context.EmitLdc_I8(09L << 56 | 08L << 48 | 11L << 40 | 10L << 32 | 13L << 24 | 12L << 16 | 15L << 8 | 14L << 0); // maskE1
  303. context.EmitLdc_I8(01L << 56 | 00L << 48 | 03L << 40 | 02L << 32 | 05L << 24 | 04L << 16 | 07L << 8 | 06L << 0); // maskE0
  304. }
  305. else /* if (op.Size == 2) */
  306. {
  307. context.EmitLdc_I8(11L << 56 | 10L << 48 | 09L << 40 | 08L << 32 | 15L << 24 | 14L << 16 | 13L << 8 | 12L << 0); // maskE1
  308. context.EmitLdc_I8(03L << 56 | 02L << 48 | 01L << 40 | 00L << 32 | 07L << 24 | 06L << 16 | 05L << 8 | 04L << 0); // maskE0
  309. }
  310. context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetVector128), typesSve));
  311. context.EmitCall(typeof(Ssse3).GetMethod(nameof(Ssse3.Shuffle), typesSfl));
  312. context.EmitStvec(op.Rd);
  313. if (op.RegisterSize == RegisterSize.Simd64)
  314. {
  315. EmitVectorZeroUpper(context, op.Rd);
  316. }
  317. }
  318. else
  319. {
  320. EmitRev_V(context, containerSize: 3);
  321. }
  322. }
  323. private static void EmitRev_V(ILEmitterCtx context, int containerSize)
  324. {
  325. OpCodeSimd64 op = (OpCodeSimd64)context.CurrOp;
  326. int bytes = op.GetBitsCount() >> 3;
  327. int elems = bytes >> op.Size;
  328. int containerMask = (1 << (containerSize - op.Size)) - 1;
  329. for (int index = 0; index < elems; index++)
  330. {
  331. int revIndex = index ^ containerMask;
  332. EmitVectorExtractZx(context, op.Rn, revIndex, op.Size);
  333. EmitVectorInsertTmp(context, index, op.Size);
  334. }
  335. context.EmitLdvectmp();
  336. context.EmitStvec(op.Rd);
  337. if (op.RegisterSize == RegisterSize.Simd64)
  338. {
  339. EmitVectorZeroUpper(context, op.Rd);
  340. }
  341. }
  342. }
  343. }