AInstEmitSimdShift.cs 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591
  1. using ChocolArm64.Decoder;
  2. using ChocolArm64.State;
  3. using ChocolArm64.Translation;
  4. using System;
  5. using System.Reflection.Emit;
  6. using static ChocolArm64.Instruction.AInstEmitSimdHelper;
  7. namespace ChocolArm64.Instruction
  8. {
  9. static partial class AInstEmit
  10. {
  11. public static void Rshrn_V(AILEmitterCtx Context)
  12. {
  13. EmitVectorShrImmNarrowOpZx(Context, Round: true);
  14. }
  15. public static void Shl_S(AILEmitterCtx Context)
  16. {
  17. AOpCodeSimdShImm Op = (AOpCodeSimdShImm)Context.CurrOp;
  18. EmitScalarUnaryOpZx(Context, () =>
  19. {
  20. Context.EmitLdc_I4(GetImmShl(Op));
  21. Context.Emit(OpCodes.Shl);
  22. });
  23. }
  24. public static void Shl_V(AILEmitterCtx Context)
  25. {
  26. AOpCodeSimdShImm Op = (AOpCodeSimdShImm)Context.CurrOp;
  27. EmitVectorUnaryOpZx(Context, () =>
  28. {
  29. Context.EmitLdc_I4(GetImmShl(Op));
  30. Context.Emit(OpCodes.Shl);
  31. });
  32. }
  33. public static void Shll_V(AILEmitterCtx Context)
  34. {
  35. AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
  36. int Shift = 8 << Op.Size;
  37. EmitVectorShImmWidenBinaryZx(Context, () => Context.Emit(OpCodes.Shl), Shift);
  38. }
  39. public static void Shrn_V(AILEmitterCtx Context)
  40. {
  41. EmitVectorShrImmNarrowOpZx(Context, Round: false);
  42. }
  43. public static void Sli_V(AILEmitterCtx Context)
  44. {
  45. AOpCodeSimdShImm Op = (AOpCodeSimdShImm)Context.CurrOp;
  46. int Bytes = Op.GetBitsCount() >> 3;
  47. int Elems = Bytes >> Op.Size;
  48. int Shift = GetImmShl(Op);
  49. ulong Mask = Shift != 0 ? ulong.MaxValue >> (64 - Shift) : 0;
  50. for (int Index = 0; Index < Elems; Index++)
  51. {
  52. EmitVectorExtractZx(Context, Op.Rn, Index, Op.Size);
  53. Context.EmitLdc_I4(Shift);
  54. Context.Emit(OpCodes.Shl);
  55. EmitVectorExtractZx(Context, Op.Rd, Index, Op.Size);
  56. Context.EmitLdc_I8((long)Mask);
  57. Context.Emit(OpCodes.And);
  58. Context.Emit(OpCodes.Or);
  59. EmitVectorInsert(Context, Op.Rd, Index, Op.Size);
  60. }
  61. if (Op.RegisterSize == ARegisterSize.SIMD64)
  62. {
  63. EmitVectorZeroUpper(Context, Op.Rd);
  64. }
  65. }
  66. public static void Sqrshrn_S(AILEmitterCtx Context)
  67. {
  68. EmitRoundShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.ScalarSxSx);
  69. }
  70. public static void Sqrshrn_V(AILEmitterCtx Context)
  71. {
  72. EmitRoundShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.VectorSxSx);
  73. }
  74. public static void Sqrshrun_S(AILEmitterCtx Context)
  75. {
  76. EmitRoundShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.ScalarSxZx);
  77. }
  78. public static void Sqrshrun_V(AILEmitterCtx Context)
  79. {
  80. EmitRoundShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.VectorSxZx);
  81. }
  82. public static void Sqshrn_S(AILEmitterCtx Context)
  83. {
  84. EmitShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.ScalarSxSx);
  85. }
  86. public static void Sqshrn_V(AILEmitterCtx Context)
  87. {
  88. EmitShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.VectorSxSx);
  89. }
  90. public static void Sqshrun_S(AILEmitterCtx Context)
  91. {
  92. EmitShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.ScalarSxZx);
  93. }
  94. public static void Sqshrun_V(AILEmitterCtx Context)
  95. {
  96. EmitShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.VectorSxZx);
  97. }
  98. public static void Srshr_S(AILEmitterCtx Context)
  99. {
  100. EmitScalarShrImmOpSx(Context, ShrImmFlags.Round);
  101. }
  102. public static void Srshr_V(AILEmitterCtx Context)
  103. {
  104. EmitVectorShrImmOpSx(Context, ShrImmFlags.Round);
  105. }
  106. public static void Srsra_S(AILEmitterCtx Context)
  107. {
  108. EmitScalarShrImmOpSx(Context, ShrImmFlags.Round | ShrImmFlags.Accumulate);
  109. }
  110. public static void Srsra_V(AILEmitterCtx Context)
  111. {
  112. EmitVectorShrImmOpSx(Context, ShrImmFlags.Round | ShrImmFlags.Accumulate);
  113. }
  114. public static void Sshl_V(AILEmitterCtx Context)
  115. {
  116. EmitVectorShl(Context, Signed: true);
  117. }
  118. public static void Sshll_V(AILEmitterCtx Context)
  119. {
  120. AOpCodeSimdShImm Op = (AOpCodeSimdShImm)Context.CurrOp;
  121. EmitVectorShImmWidenBinarySx(Context, () => Context.Emit(OpCodes.Shl), GetImmShl(Op));
  122. }
  123. public static void Sshr_S(AILEmitterCtx Context)
  124. {
  125. EmitShrImmOp(Context, ShrImmFlags.ScalarSx);
  126. }
  127. public static void Sshr_V(AILEmitterCtx Context)
  128. {
  129. EmitShrImmOp(Context, ShrImmFlags.VectorSx);
  130. }
  131. public static void Ssra_S(AILEmitterCtx Context)
  132. {
  133. EmitScalarShrImmOpSx(Context, ShrImmFlags.Accumulate);
  134. }
  135. public static void Ssra_V(AILEmitterCtx Context)
  136. {
  137. EmitVectorShrImmOpSx(Context, ShrImmFlags.Accumulate);
  138. }
  139. public static void Uqrshrn_S(AILEmitterCtx Context)
  140. {
  141. EmitRoundShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.ScalarZxZx);
  142. }
  143. public static void Uqrshrn_V(AILEmitterCtx Context)
  144. {
  145. EmitRoundShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.VectorZxZx);
  146. }
  147. public static void Uqshrn_S(AILEmitterCtx Context)
  148. {
  149. EmitShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.ScalarZxZx);
  150. }
  151. public static void Uqshrn_V(AILEmitterCtx Context)
  152. {
  153. EmitShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.VectorZxZx);
  154. }
  155. public static void Urshr_S(AILEmitterCtx Context)
  156. {
  157. EmitScalarShrImmOpZx(Context, ShrImmFlags.Round);
  158. }
  159. public static void Urshr_V(AILEmitterCtx Context)
  160. {
  161. EmitVectorShrImmOpZx(Context, ShrImmFlags.Round);
  162. }
  163. public static void Ursra_S(AILEmitterCtx Context)
  164. {
  165. EmitScalarShrImmOpZx(Context, ShrImmFlags.Round | ShrImmFlags.Accumulate);
  166. }
  167. public static void Ursra_V(AILEmitterCtx Context)
  168. {
  169. EmitVectorShrImmOpZx(Context, ShrImmFlags.Round | ShrImmFlags.Accumulate);
  170. }
  171. public static void Ushl_V(AILEmitterCtx Context)
  172. {
  173. EmitVectorShl(Context, Signed: false);
  174. }
  175. public static void Ushll_V(AILEmitterCtx Context)
  176. {
  177. AOpCodeSimdShImm Op = (AOpCodeSimdShImm)Context.CurrOp;
  178. EmitVectorShImmWidenBinaryZx(Context, () => Context.Emit(OpCodes.Shl), GetImmShl(Op));
  179. }
  180. public static void Ushr_S(AILEmitterCtx Context)
  181. {
  182. EmitShrImmOp(Context, ShrImmFlags.ScalarZx);
  183. }
  184. public static void Ushr_V(AILEmitterCtx Context)
  185. {
  186. EmitShrImmOp(Context, ShrImmFlags.VectorZx);
  187. }
  188. public static void Usra_S(AILEmitterCtx Context)
  189. {
  190. EmitScalarShrImmOpZx(Context, ShrImmFlags.Accumulate);
  191. }
  192. public static void Usra_V(AILEmitterCtx Context)
  193. {
  194. EmitVectorShrImmOpZx(Context, ShrImmFlags.Accumulate);
  195. }
  196. private static void EmitVectorShl(AILEmitterCtx Context, bool Signed)
  197. {
  198. //This instruction shifts the value on vector A by the number of bits
  199. //specified on the signed, lower 8 bits of vector B. If the shift value
  200. //is greater or equal to the data size of each lane, then the result is zero.
  201. //Additionally, negative shifts produces right shifts by the negated shift value.
  202. AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
  203. int MaxShift = 8 << Op.Size;
  204. Action Emit = () =>
  205. {
  206. AILLabel LblShl = new AILLabel();
  207. AILLabel LblZero = new AILLabel();
  208. AILLabel LblEnd = new AILLabel();
  209. void EmitShift(OpCode ILOp)
  210. {
  211. Context.Emit(OpCodes.Dup);
  212. Context.EmitLdc_I4(MaxShift);
  213. Context.Emit(OpCodes.Bge_S, LblZero);
  214. Context.Emit(ILOp);
  215. Context.Emit(OpCodes.Br_S, LblEnd);
  216. }
  217. Context.Emit(OpCodes.Conv_I1);
  218. Context.Emit(OpCodes.Dup);
  219. Context.EmitLdc_I4(0);
  220. Context.Emit(OpCodes.Bge_S, LblShl);
  221. Context.Emit(OpCodes.Neg);
  222. EmitShift(Signed
  223. ? OpCodes.Shr
  224. : OpCodes.Shr_Un);
  225. Context.MarkLabel(LblShl);
  226. EmitShift(OpCodes.Shl);
  227. Context.MarkLabel(LblZero);
  228. Context.Emit(OpCodes.Pop);
  229. Context.Emit(OpCodes.Pop);
  230. Context.EmitLdc_I8(0);
  231. Context.MarkLabel(LblEnd);
  232. };
  233. if (Signed)
  234. {
  235. EmitVectorBinaryOpSx(Context, Emit);
  236. }
  237. else
  238. {
  239. EmitVectorBinaryOpZx(Context, Emit);
  240. }
  241. }
  242. [Flags]
  243. private enum ShrImmFlags
  244. {
  245. Scalar = 1 << 0,
  246. Signed = 1 << 1,
  247. Round = 1 << 2,
  248. Accumulate = 1 << 3,
  249. ScalarSx = Scalar | Signed,
  250. ScalarZx = Scalar,
  251. VectorSx = Signed,
  252. VectorZx = 0
  253. }
  254. private static void EmitScalarShrImmOpSx(AILEmitterCtx Context, ShrImmFlags Flags)
  255. {
  256. EmitShrImmOp(Context, ShrImmFlags.ScalarSx | Flags);
  257. }
  258. private static void EmitScalarShrImmOpZx(AILEmitterCtx Context, ShrImmFlags Flags)
  259. {
  260. EmitShrImmOp(Context, ShrImmFlags.ScalarZx | Flags);
  261. }
  262. private static void EmitVectorShrImmOpSx(AILEmitterCtx Context, ShrImmFlags Flags)
  263. {
  264. EmitShrImmOp(Context, ShrImmFlags.VectorSx | Flags);
  265. }
  266. private static void EmitVectorShrImmOpZx(AILEmitterCtx Context, ShrImmFlags Flags)
  267. {
  268. EmitShrImmOp(Context, ShrImmFlags.VectorZx | Flags);
  269. }
  270. private static void EmitShrImmOp(AILEmitterCtx Context, ShrImmFlags Flags)
  271. {
  272. AOpCodeSimdShImm Op = (AOpCodeSimdShImm)Context.CurrOp;
  273. bool Scalar = (Flags & ShrImmFlags.Scalar) != 0;
  274. bool Signed = (Flags & ShrImmFlags.Signed) != 0;
  275. bool Round = (Flags & ShrImmFlags.Round) != 0;
  276. bool Accumulate = (Flags & ShrImmFlags.Accumulate) != 0;
  277. int Shift = GetImmShr(Op);
  278. long RoundConst = 1L << (Shift - 1);
  279. int Bytes = Op.GetBitsCount() >> 3;
  280. int Elems = !Scalar ? Bytes >> Op.Size : 1;
  281. for (int Index = 0; Index < Elems; Index++)
  282. {
  283. EmitVectorExtract(Context, Op.Rn, Index, Op.Size, Signed);
  284. if (Op.Size <= 2)
  285. {
  286. if (Round)
  287. {
  288. Context.EmitLdc_I8(RoundConst);
  289. Context.Emit(OpCodes.Add);
  290. }
  291. Context.EmitLdc_I4(Shift);
  292. Context.Emit(Signed ? OpCodes.Shr : OpCodes.Shr_Un);
  293. }
  294. else /* if (Op.Size == 3) */
  295. {
  296. EmitShrImm_64(Context, Signed, Round ? RoundConst : 0L, Shift);
  297. }
  298. if (Accumulate)
  299. {
  300. EmitVectorExtract(Context, Op.Rd, Index, Op.Size, Signed);
  301. Context.Emit(OpCodes.Add);
  302. }
  303. EmitVectorInsertTmp(Context, Index, Op.Size);
  304. }
  305. Context.EmitLdvectmp();
  306. Context.EmitStvec(Op.Rd);
  307. if ((Op.RegisterSize == ARegisterSize.SIMD64) || Scalar)
  308. {
  309. EmitVectorZeroUpper(Context, Op.Rd);
  310. }
  311. }
  312. private static void EmitVectorShrImmNarrowOpZx(AILEmitterCtx Context, bool Round)
  313. {
  314. AOpCodeSimdShImm Op = (AOpCodeSimdShImm)Context.CurrOp;
  315. int Shift = GetImmShr(Op);
  316. long RoundConst = 1L << (Shift - 1);
  317. int Elems = 8 >> Op.Size;
  318. int Part = Op.RegisterSize == ARegisterSize.SIMD128 ? Elems : 0;
  319. if (Part != 0)
  320. {
  321. Context.EmitLdvec(Op.Rd);
  322. Context.EmitStvectmp();
  323. }
  324. for (int Index = 0; Index < Elems; Index++)
  325. {
  326. EmitVectorExtractZx(Context, Op.Rn, Index, Op.Size + 1);
  327. if (Round)
  328. {
  329. Context.EmitLdc_I8(RoundConst);
  330. Context.Emit(OpCodes.Add);
  331. }
  332. Context.EmitLdc_I4(Shift);
  333. Context.Emit(OpCodes.Shr_Un);
  334. EmitVectorInsertTmp(Context, Part + Index, Op.Size);
  335. }
  336. Context.EmitLdvectmp();
  337. Context.EmitStvec(Op.Rd);
  338. if (Part == 0)
  339. {
  340. EmitVectorZeroUpper(Context, Op.Rd);
  341. }
  342. }
  343. [Flags]
  344. private enum ShrImmSaturatingNarrowFlags
  345. {
  346. Scalar = 1 << 0,
  347. SignedSrc = 1 << 1,
  348. SignedDst = 1 << 2,
  349. Round = 1 << 3,
  350. ScalarSxSx = Scalar | SignedSrc | SignedDst,
  351. ScalarSxZx = Scalar | SignedSrc,
  352. ScalarZxZx = Scalar,
  353. VectorSxSx = SignedSrc | SignedDst,
  354. VectorSxZx = SignedSrc,
  355. VectorZxZx = 0
  356. }
  357. private static void EmitRoundShrImmSaturatingNarrowOp(AILEmitterCtx Context, ShrImmSaturatingNarrowFlags Flags)
  358. {
  359. EmitShrImmSaturatingNarrowOp(Context, ShrImmSaturatingNarrowFlags.Round | Flags);
  360. }
  361. private static void EmitShrImmSaturatingNarrowOp(AILEmitterCtx Context, ShrImmSaturatingNarrowFlags Flags)
  362. {
  363. AOpCodeSimdShImm Op = (AOpCodeSimdShImm)Context.CurrOp;
  364. bool Scalar = (Flags & ShrImmSaturatingNarrowFlags.Scalar) != 0;
  365. bool SignedSrc = (Flags & ShrImmSaturatingNarrowFlags.SignedSrc) != 0;
  366. bool SignedDst = (Flags & ShrImmSaturatingNarrowFlags.SignedDst) != 0;
  367. bool Round = (Flags & ShrImmSaturatingNarrowFlags.Round) != 0;
  368. int Shift = GetImmShr(Op);
  369. long RoundConst = 1L << (Shift - 1);
  370. int Elems = !Scalar ? 8 >> Op.Size : 1;
  371. int Part = !Scalar && (Op.RegisterSize == ARegisterSize.SIMD128) ? Elems : 0;
  372. if (Scalar)
  373. {
  374. EmitVectorZeroLowerTmp(Context);
  375. }
  376. if (Part != 0)
  377. {
  378. Context.EmitLdvec(Op.Rd);
  379. Context.EmitStvectmp();
  380. }
  381. for (int Index = 0; Index < Elems; Index++)
  382. {
  383. EmitVectorExtract(Context, Op.Rn, Index, Op.Size + 1, SignedSrc);
  384. if (Op.Size <= 1 || !Round)
  385. {
  386. if (Round)
  387. {
  388. Context.EmitLdc_I8(RoundConst);
  389. Context.Emit(OpCodes.Add);
  390. }
  391. Context.EmitLdc_I4(Shift);
  392. Context.Emit(SignedSrc ? OpCodes.Shr : OpCodes.Shr_Un);
  393. }
  394. else /* if (Op.Size == 2 && Round) */
  395. {
  396. EmitShrImm_64(Context, SignedSrc, RoundConst, Shift); // Shift <= 32
  397. }
  398. EmitSatQ(Context, Op.Size, SignedSrc, SignedDst);
  399. EmitVectorInsertTmp(Context, Part + Index, Op.Size);
  400. }
  401. Context.EmitLdvectmp();
  402. Context.EmitStvec(Op.Rd);
  403. if (Part == 0)
  404. {
  405. EmitVectorZeroUpper(Context, Op.Rd);
  406. }
  407. }
  408. // Dst_64 = (Int(Src_64, Signed) + RoundConst) >> Shift;
  409. private static void EmitShrImm_64(
  410. AILEmitterCtx Context,
  411. bool Signed,
  412. long RoundConst,
  413. int Shift)
  414. {
  415. Context.EmitLdc_I8(RoundConst);
  416. Context.EmitLdc_I4(Shift);
  417. ASoftFallback.EmitCall(Context, Signed
  418. ? nameof(ASoftFallback.SignedShrImm_64)
  419. : nameof(ASoftFallback.UnsignedShrImm_64));
  420. }
  421. private static void EmitVectorShImmWidenBinarySx(AILEmitterCtx Context, Action Emit, int Imm)
  422. {
  423. EmitVectorShImmWidenBinaryOp(Context, Emit, Imm, true);
  424. }
  425. private static void EmitVectorShImmWidenBinaryZx(AILEmitterCtx Context, Action Emit, int Imm)
  426. {
  427. EmitVectorShImmWidenBinaryOp(Context, Emit, Imm, false);
  428. }
  429. private static void EmitVectorShImmWidenBinaryOp(AILEmitterCtx Context, Action Emit, int Imm, bool Signed)
  430. {
  431. AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
  432. int Elems = 8 >> Op.Size;
  433. int Part = Op.RegisterSize == ARegisterSize.SIMD128 ? Elems : 0;
  434. for (int Index = 0; Index < Elems; Index++)
  435. {
  436. EmitVectorExtract(Context, Op.Rn, Part + Index, Op.Size, Signed);
  437. Context.EmitLdc_I4(Imm);
  438. Emit();
  439. EmitVectorInsertTmp(Context, Index, Op.Size + 1);
  440. }
  441. Context.EmitLdvectmp();
  442. Context.EmitStvec(Op.Rd);
  443. }
  444. }
  445. }