InstEmitSimdCmp32.cs 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437
  1. using ARMeilleure.Decoders;
  2. using ARMeilleure.IntermediateRepresentation;
  3. using ARMeilleure.State;
  4. using ARMeilleure.Translation;
  5. using System;
  6. using static ARMeilleure.Instructions.InstEmitHelper;
  7. using static ARMeilleure.Instructions.InstEmitSimdHelper;
  8. using static ARMeilleure.Instructions.InstEmitSimdHelper32;
  9. using static ARMeilleure.IntermediateRepresentation.Operand.Factory;
  10. namespace ARMeilleure.Instructions
  11. {
  12. using Func2I = Func<Operand, Operand, Operand>;
  13. static partial class InstEmit32
  14. {
  15. public static void Vceq_V(ArmEmitterContext context)
  16. {
  17. if (Optimizations.FastFP && Optimizations.UseAdvSimd)
  18. {
  19. InstEmitSimdHelper32Arm64.EmitCmpOpF32(context, CmpCondition.Equal, false);
  20. }
  21. else if (Optimizations.FastFP && Optimizations.UseSse2)
  22. {
  23. EmitSse2OrAvxCmpOpF32(context, CmpCondition.Equal, false);
  24. }
  25. else
  26. {
  27. EmitCmpOpF32(context, nameof(SoftFloat32.FPCompareEQFpscr), false);
  28. }
  29. }
  30. public static void Vceq_I(ArmEmitterContext context)
  31. {
  32. EmitCmpOpI32(context, context.ICompareEqual, context.ICompareEqual, false, false);
  33. }
  34. public static void Vceq_Z(ArmEmitterContext context)
  35. {
  36. OpCode32Simd op = (OpCode32Simd)context.CurrOp;
  37. if (op.F)
  38. {
  39. if (Optimizations.FastFP && Optimizations.UseAdvSimd)
  40. {
  41. InstEmitSimdHelper32Arm64.EmitCmpOpF32(context, CmpCondition.Equal, true);
  42. }
  43. else if (Optimizations.FastFP && Optimizations.UseSse2)
  44. {
  45. EmitSse2OrAvxCmpOpF32(context, CmpCondition.Equal, true);
  46. }
  47. else
  48. {
  49. EmitCmpOpF32(context, nameof(SoftFloat32.FPCompareEQFpscr), true);
  50. }
  51. }
  52. else
  53. {
  54. EmitCmpOpI32(context, context.ICompareEqual, context.ICompareEqual, true, false);
  55. }
  56. }
  57. public static void Vcge_V(ArmEmitterContext context)
  58. {
  59. if (Optimizations.FastFP && Optimizations.UseAdvSimd)
  60. {
  61. InstEmitSimdHelper32Arm64.EmitCmpOpF32(context, CmpCondition.GreaterThanOrEqual, false);
  62. }
  63. else if (Optimizations.FastFP && Optimizations.UseAvx)
  64. {
  65. EmitSse2OrAvxCmpOpF32(context, CmpCondition.GreaterThanOrEqual, false);
  66. }
  67. else
  68. {
  69. EmitCmpOpF32(context, nameof(SoftFloat32.FPCompareGEFpscr), false);
  70. }
  71. }
  72. public static void Vcge_I(ArmEmitterContext context)
  73. {
  74. OpCode32SimdReg op = (OpCode32SimdReg)context.CurrOp;
  75. EmitCmpOpI32(context, context.ICompareGreaterOrEqual, context.ICompareGreaterOrEqualUI, false, !op.U);
  76. }
  77. public static void Vcge_Z(ArmEmitterContext context)
  78. {
  79. OpCode32Simd op = (OpCode32Simd)context.CurrOp;
  80. if (op.F)
  81. {
  82. if (Optimizations.FastFP && Optimizations.UseAdvSimd)
  83. {
  84. InstEmitSimdHelper32Arm64.EmitCmpOpF32(context, CmpCondition.GreaterThanOrEqual, true);
  85. }
  86. else if (Optimizations.FastFP && Optimizations.UseAvx)
  87. {
  88. EmitSse2OrAvxCmpOpF32(context, CmpCondition.GreaterThanOrEqual, true);
  89. }
  90. else
  91. {
  92. EmitCmpOpF32(context, nameof(SoftFloat32.FPCompareGEFpscr), true);
  93. }
  94. }
  95. else
  96. {
  97. EmitCmpOpI32(context, context.ICompareGreaterOrEqual, context.ICompareGreaterOrEqualUI, true, true);
  98. }
  99. }
  100. public static void Vcgt_V(ArmEmitterContext context)
  101. {
  102. if (Optimizations.FastFP && Optimizations.UseAdvSimd)
  103. {
  104. InstEmitSimdHelper32Arm64.EmitCmpOpF32(context, CmpCondition.GreaterThan, false);
  105. }
  106. else if (Optimizations.FastFP && Optimizations.UseAvx)
  107. {
  108. EmitSse2OrAvxCmpOpF32(context, CmpCondition.GreaterThan, false);
  109. }
  110. else
  111. {
  112. EmitCmpOpF32(context, nameof(SoftFloat32.FPCompareGTFpscr), false);
  113. }
  114. }
  115. public static void Vcgt_I(ArmEmitterContext context)
  116. {
  117. OpCode32SimdReg op = (OpCode32SimdReg)context.CurrOp;
  118. EmitCmpOpI32(context, context.ICompareGreater, context.ICompareGreaterUI, false, !op.U);
  119. }
  120. public static void Vcgt_Z(ArmEmitterContext context)
  121. {
  122. OpCode32Simd op = (OpCode32Simd)context.CurrOp;
  123. if (op.F)
  124. {
  125. if (Optimizations.FastFP && Optimizations.UseAdvSimd)
  126. {
  127. InstEmitSimdHelper32Arm64.EmitCmpOpF32(context, CmpCondition.GreaterThan, true);
  128. }
  129. else if (Optimizations.FastFP && Optimizations.UseAvx)
  130. {
  131. EmitSse2OrAvxCmpOpF32(context, CmpCondition.GreaterThan, true);
  132. }
  133. else
  134. {
  135. EmitCmpOpF32(context, nameof(SoftFloat32.FPCompareGTFpscr), true);
  136. }
  137. }
  138. else
  139. {
  140. EmitCmpOpI32(context, context.ICompareGreater, context.ICompareGreaterUI, true, true);
  141. }
  142. }
  143. public static void Vcle_Z(ArmEmitterContext context)
  144. {
  145. OpCode32Simd op = (OpCode32Simd)context.CurrOp;
  146. if (op.F)
  147. {
  148. if (Optimizations.FastFP && Optimizations.UseAdvSimd)
  149. {
  150. InstEmitSimdHelper32Arm64.EmitCmpOpF32(context, CmpCondition.LessThanOrEqual, true);
  151. }
  152. else if (Optimizations.FastFP && Optimizations.UseSse2)
  153. {
  154. EmitSse2OrAvxCmpOpF32(context, CmpCondition.LessThanOrEqual, true);
  155. }
  156. else
  157. {
  158. EmitCmpOpF32(context, nameof(SoftFloat32.FPCompareLEFpscr), true);
  159. }
  160. }
  161. else
  162. {
  163. EmitCmpOpI32(context, context.ICompareLessOrEqual, context.ICompareLessOrEqualUI, true, true);
  164. }
  165. }
  166. public static void Vclt_Z(ArmEmitterContext context)
  167. {
  168. OpCode32Simd op = (OpCode32Simd)context.CurrOp;
  169. if (op.F)
  170. {
  171. if (Optimizations.FastFP && Optimizations.UseAdvSimd)
  172. {
  173. InstEmitSimdHelper32Arm64.EmitCmpOpF32(context, CmpCondition.LessThan, true);
  174. }
  175. else if (Optimizations.FastFP && Optimizations.UseSse2)
  176. {
  177. EmitSse2OrAvxCmpOpF32(context, CmpCondition.LessThan, true);
  178. }
  179. else
  180. {
  181. EmitCmpOpF32(context, nameof(SoftFloat32.FPCompareLTFpscr), true);
  182. }
  183. }
  184. else
  185. {
  186. EmitCmpOpI32(context, context.ICompareLess, context.ICompareLessUI, true, true);
  187. }
  188. }
  189. private static void EmitCmpOpF32(ArmEmitterContext context, string name, bool zero)
  190. {
  191. if (zero)
  192. {
  193. EmitVectorUnaryOpF32(context, (m) =>
  194. {
  195. Operand zeroOp = m.Type == OperandType.FP64 ? ConstF(0.0d) : ConstF(0.0f);
  196. return EmitSoftFloatCallDefaultFpscr(context, name, m, zeroOp);
  197. });
  198. }
  199. else
  200. {
  201. EmitVectorBinaryOpF32(context, (n, m) =>
  202. {
  203. return EmitSoftFloatCallDefaultFpscr(context, name, n, m);
  204. });
  205. }
  206. }
  207. private static Operand ZerosOrOnes(ArmEmitterContext context, Operand fromBool, OperandType baseType)
  208. {
  209. var ones = (baseType == OperandType.I64) ? Const(-1L) : Const(-1);
  210. return context.ConditionalSelect(fromBool, ones, Const(baseType, 0L));
  211. }
  212. private static void EmitCmpOpI32(
  213. ArmEmitterContext context,
  214. Func2I signedOp,
  215. Func2I unsignedOp,
  216. bool zero,
  217. bool signed)
  218. {
  219. if (zero)
  220. {
  221. if (signed)
  222. {
  223. EmitVectorUnaryOpSx32(context, (m) =>
  224. {
  225. OperandType type = m.Type;
  226. Operand zeroV = (type == OperandType.I64) ? Const(0L) : Const(0);
  227. return ZerosOrOnes(context, signedOp(m, zeroV), type);
  228. });
  229. }
  230. else
  231. {
  232. EmitVectorUnaryOpZx32(context, (m) =>
  233. {
  234. OperandType type = m.Type;
  235. Operand zeroV = (type == OperandType.I64) ? Const(0L) : Const(0);
  236. return ZerosOrOnes(context, unsignedOp(m, zeroV), type);
  237. });
  238. }
  239. }
  240. else
  241. {
  242. if (signed)
  243. {
  244. EmitVectorBinaryOpSx32(context, (n, m) => ZerosOrOnes(context, signedOp(n, m), n.Type));
  245. }
  246. else
  247. {
  248. EmitVectorBinaryOpZx32(context, (n, m) => ZerosOrOnes(context, unsignedOp(n, m), n.Type));
  249. }
  250. }
  251. }
  252. public static void Vcmp(ArmEmitterContext context)
  253. {
  254. if (Optimizations.UseAdvSimd)
  255. {
  256. InstEmitSimdHelper32Arm64.EmitVcmpOrVcmpe(context, false);
  257. }
  258. else
  259. {
  260. EmitVcmpOrVcmpe(context, false);
  261. }
  262. }
  263. public static void Vcmpe(ArmEmitterContext context)
  264. {
  265. if (Optimizations.UseAdvSimd)
  266. {
  267. InstEmitSimdHelper32Arm64.EmitVcmpOrVcmpe(context, true);
  268. }
  269. else
  270. {
  271. EmitVcmpOrVcmpe(context, true);
  272. }
  273. }
  274. private static void EmitVcmpOrVcmpe(ArmEmitterContext context, bool signalNaNs)
  275. {
  276. OpCode32SimdS op = (OpCode32SimdS)context.CurrOp;
  277. bool cmpWithZero = (op.Opc & 2) != 0;
  278. int sizeF = op.Size & 1;
  279. if (Optimizations.FastFP && (signalNaNs ? Optimizations.UseAvx : Optimizations.UseSse2))
  280. {
  281. CmpCondition cmpOrdered = signalNaNs ? CmpCondition.OrderedS : CmpCondition.OrderedQ;
  282. bool doubleSize = sizeF != 0;
  283. int shift = doubleSize ? 1 : 2;
  284. Operand m = GetVecA32(op.Vm >> shift);
  285. Operand n = GetVecA32(op.Vd >> shift);
  286. n = EmitSwapScalar(context, n, op.Vd, doubleSize);
  287. m = cmpWithZero ? context.VectorZero() : EmitSwapScalar(context, m, op.Vm, doubleSize);
  288. Operand lblNaN = Label();
  289. Operand lblEnd = Label();
  290. if (!doubleSize)
  291. {
  292. Operand ordMask = context.AddIntrinsic(Intrinsic.X86Cmpss, n, m, Const((int)cmpOrdered));
  293. Operand isOrdered = context.AddIntrinsicInt(Intrinsic.X86Cvtsi2si, ordMask);
  294. context.BranchIfFalse(lblNaN, isOrdered);
  295. Operand cf = context.AddIntrinsicInt(Intrinsic.X86Comissge, n, m);
  296. Operand zf = context.AddIntrinsicInt(Intrinsic.X86Comisseq, n, m);
  297. Operand nf = context.AddIntrinsicInt(Intrinsic.X86Comisslt, n, m);
  298. SetFpFlag(context, FPState.VFlag, Const(0));
  299. SetFpFlag(context, FPState.CFlag, cf);
  300. SetFpFlag(context, FPState.ZFlag, zf);
  301. SetFpFlag(context, FPState.NFlag, nf);
  302. }
  303. else
  304. {
  305. Operand ordMask = context.AddIntrinsic(Intrinsic.X86Cmpsd, n, m, Const((int)cmpOrdered));
  306. Operand isOrdered = context.AddIntrinsicLong(Intrinsic.X86Cvtsi2si, ordMask);
  307. context.BranchIfFalse(lblNaN, isOrdered);
  308. Operand cf = context.AddIntrinsicInt(Intrinsic.X86Comisdge, n, m);
  309. Operand zf = context.AddIntrinsicInt(Intrinsic.X86Comisdeq, n, m);
  310. Operand nf = context.AddIntrinsicInt(Intrinsic.X86Comisdlt, n, m);
  311. SetFpFlag(context, FPState.VFlag, Const(0));
  312. SetFpFlag(context, FPState.CFlag, cf);
  313. SetFpFlag(context, FPState.ZFlag, zf);
  314. SetFpFlag(context, FPState.NFlag, nf);
  315. }
  316. context.Branch(lblEnd);
  317. context.MarkLabel(lblNaN);
  318. SetFpFlag(context, FPState.VFlag, Const(1));
  319. SetFpFlag(context, FPState.CFlag, Const(1));
  320. SetFpFlag(context, FPState.ZFlag, Const(0));
  321. SetFpFlag(context, FPState.NFlag, Const(0));
  322. context.MarkLabel(lblEnd);
  323. }
  324. else
  325. {
  326. OperandType type = sizeF != 0 ? OperandType.FP64 : OperandType.FP32;
  327. Operand ne = ExtractScalar(context, type, op.Vd);
  328. Operand me;
  329. if (cmpWithZero)
  330. {
  331. me = sizeF == 0 ? ConstF(0f) : ConstF(0d);
  332. }
  333. else
  334. {
  335. me = ExtractScalar(context, type, op.Vm);
  336. }
  337. Operand nzcv = EmitSoftFloatCall(context, nameof(SoftFloat32.FPCompare), ne, me, Const(signalNaNs));
  338. EmitSetFpscrNzcv(context, nzcv);
  339. }
  340. }
  341. private static void EmitSetFpscrNzcv(ArmEmitterContext context, Operand nzcv)
  342. {
  343. Operand Extract(Operand value, int bit)
  344. {
  345. if (bit != 0)
  346. {
  347. value = context.ShiftRightUI(value, Const(bit));
  348. }
  349. value = context.BitwiseAnd(value, Const(1));
  350. return value;
  351. }
  352. SetFpFlag(context, FPState.VFlag, Extract(nzcv, 0));
  353. SetFpFlag(context, FPState.CFlag, Extract(nzcv, 1));
  354. SetFpFlag(context, FPState.ZFlag, Extract(nzcv, 2));
  355. SetFpFlag(context, FPState.NFlag, Extract(nzcv, 3));
  356. }
  357. private static void EmitSse2OrAvxCmpOpF32(ArmEmitterContext context, CmpCondition cond, bool zero)
  358. {
  359. OpCode32Simd op = (OpCode32Simd)context.CurrOp;
  360. int sizeF = op.Size & 1;
  361. Intrinsic inst = (sizeF == 0) ? Intrinsic.X86Cmpps : Intrinsic.X86Cmppd;
  362. if (zero)
  363. {
  364. EmitVectorUnaryOpSimd32(context, (m) =>
  365. {
  366. return context.AddIntrinsic(inst, m, context.VectorZero(), Const((int)cond));
  367. });
  368. }
  369. else
  370. {
  371. EmitVectorBinaryOpSimd32(context, (n, m) =>
  372. {
  373. return context.AddIntrinsic(inst, n, m, Const((int)cond));
  374. });
  375. }
  376. }
  377. }
  378. }