// InstEmitHash.cs
  // https://www.intel.com/content/dam/www/public/us/en/documents/white-papers/fast-crc-computation-generic-polynomials-pclmulqdq-paper.pdf
  using ARMeilleure.Decoders;
  using ARMeilleure.IntermediateRepresentation;
  using ARMeilleure.Translation;
  using System;

  using static ARMeilleure.Instructions.InstEmitHelper;
  using static ARMeilleure.Instructions.InstEmitSimdHelper;
  using static ARMeilleure.IntermediateRepresentation.OperandHelper;
  namespace ARMeilleure.Instructions
  {
      static partial class InstEmit
      {
          // Constants shared by the PCLMULQDQ-based CRC32 / CRC32C emitters below.

          // mu' = floor(x^64/P(x))'
          private const long Crc32Mu = 0x1F7011641;
          private const long Crc32cMu = 0x0DEA713F1;

          // P'(x) << 1
          private const long Crc32Polynomial = 0x1DB710641;
          private const long Crc32cPolynomial = 0x105EC76F0;

          /// <summary>Emits CRC32 over 8 bits of data (software fallback: <c>SoftFallback.Crc32b</c>).</summary>
          public static void Crc32b(ArmEmitterContext context)
              => EmitCrc32Dispatch(context, castagnoli: false, bitsize: 8, nameof(SoftFallback.Crc32b));

          /// <summary>Emits CRC32 over 16 bits of data (software fallback: <c>SoftFallback.Crc32h</c>).</summary>
          public static void Crc32h(ArmEmitterContext context)
              => EmitCrc32Dispatch(context, castagnoli: false, bitsize: 16, nameof(SoftFallback.Crc32h));

          /// <summary>Emits CRC32 over 32 bits of data (software fallback: <c>SoftFallback.Crc32w</c>).</summary>
          public static void Crc32w(ArmEmitterContext context)
              => EmitCrc32Dispatch(context, castagnoli: false, bitsize: 32, nameof(SoftFallback.Crc32w));

          /// <summary>Emits CRC32 over 64 bits of data (software fallback: <c>SoftFallback.Crc32x</c>).</summary>
          public static void Crc32x(ArmEmitterContext context)
              => EmitCrc32Dispatch(context, castagnoli: false, bitsize: 64, nameof(SoftFallback.Crc32x));

          /// <summary>Emits CRC32C over 8 bits of data (software fallback: <c>SoftFallback.Crc32cb</c>).</summary>
          public static void Crc32cb(ArmEmitterContext context)
              => EmitCrc32Dispatch(context, castagnoli: true, bitsize: 8, nameof(SoftFallback.Crc32cb));

          /// <summary>Emits CRC32C over 16 bits of data (software fallback: <c>SoftFallback.Crc32ch</c>).</summary>
          public static void Crc32ch(ArmEmitterContext context)
              => EmitCrc32Dispatch(context, castagnoli: true, bitsize: 16, nameof(SoftFallback.Crc32ch));

          /// <summary>Emits CRC32C over 32 bits of data (software fallback: <c>SoftFallback.Crc32cw</c>).</summary>
          public static void Crc32cw(ArmEmitterContext context)
              => EmitCrc32Dispatch(context, castagnoli: true, bitsize: 32, nameof(SoftFallback.Crc32cw));

          /// <summary>Emits CRC32C over 64 bits of data (software fallback: <c>SoftFallback.Crc32cx</c>).</summary>
          public static void Crc32cx(ArmEmitterContext context)
              => EmitCrc32Dispatch(context, castagnoli: true, bitsize: 64, nameof(SoftFallback.Crc32cx));

          /// <summary>
          /// Picks the code path for one CRC32 variant: the carry-less-multiply sequence when
          /// <c>Optimizations.UsePclmulqdq</c> is set, otherwise a call into <c>SoftFallback</c>.
          /// </summary>
          /// <param name="context">Emitter context for the instruction being translated.</param>
          /// <param name="castagnoli">True for the CRC32C entry points, false for the CRC32 ones.</param>
          /// <param name="bitsize">Data width in bits: 8, 16, 32 or 64.</param>
          /// <param name="fallbackName">Name of the <c>SoftFallback</c> method used when PCLMULQDQ is not enabled.</param>
          private static void EmitCrc32Dispatch(ArmEmitterContext context, bool castagnoli, int bitsize, string fallbackName)
          {
              if (!Optimizations.UsePclmulqdq)
              {
                  EmitCrc32Call(context, fallbackName);
              }
              else if (bitsize == 64)
              {
                  // The 64-bit form needs a longer sequence and has its own emitter.
                  EmitCrc32Optimized64(context, castagnoli);
              }
              else
              {
                  EmitCrc32Optimized(context, castagnoli, bitsize);
              }
          }

          /// <summary>
          /// Emits the PCLMULQDQ-based sequence for the 8-, 16- and 32-bit CRC32 variants and writes
          /// the 32-bit result to Rd.
          /// </summary>
          /// <param name="context">Emitter context; <c>CurrOp</c> must be an <c>OpCodeAluBinary</c>.</param>
          /// <param name="castagnoli">Selects the CRC32C constants when true, the CRC32 constants when false.</param>
          /// <param name="bitsize">Data width in bits; must be 8, 16 or 32.</param>
          /// <exception cref="ArgumentOutOfRangeException"><paramref name="bitsize"/> is not 8, 16 or 32.</exception>
          private static void EmitCrc32Optimized(ArmEmitterContext context, bool castagnoli, int bitsize)
          {
              OpCodeAluBinary op = (OpCodeAluBinary)context.CurrOp;

              long mu = castagnoli ? Crc32cMu : Crc32Mu;
              long polynomial = castagnoli ? Crc32cPolynomial : Crc32Polynomial;

              Operand crc = GetIntOrZR(context, op.Rn);
              Operand data = GetIntOrZR(context, op.Rm);

              // Move both inputs into element 0 of otherwise zeroed vectors.
              crc = context.VectorInsert(context.VectorZero(), crc, 0);

              switch (bitsize)
              {
                  case 8: data = context.VectorInsert8(context.VectorZero(), data, 0); break;
                  case 16: data = context.VectorInsert16(context.VectorZero(), data, 0); break;
                  case 32: data = context.VectorInsert(context.VectorZero(), data, 0); break;
                  default:
                      // Without this, an unexpected width would leave 'data' as a scalar operand
                      // and silently feed it to the vector XOR below.
                      throw new ArgumentOutOfRangeException(nameof(bitsize), bitsize, "CRC32 data size must be 8, 16 or 32 bits.");
              }

              // Combine crc and data, shift the quadword left by (64 - bitsize) bits, then
              // carry-less multiply by mu and by the polynomial.
              Operand tmp = context.AddIntrinsic(Intrinsic.X86Pxor, crc, data);
              tmp = context.AddIntrinsic(Intrinsic.X86Psllq, tmp, Const(64 - bitsize));
              tmp = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, tmp, X86GetScalar(context, mu), Const(0));
              tmp = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, tmp, X86GetScalar(context, polynomial), Const(0));

              if (bitsize < 32)
              {
                  // For the narrow forms the original crc, byte-shifted left by (64 - bitsize) / 8,
                  // is XORed back into the product.
                  crc = context.AddIntrinsic(Intrinsic.X86Pslldq, crc, Const((64 - bitsize) / 8));
                  tmp = context.AddIntrinsic(Intrinsic.X86Pxor, tmp, crc);
              }

              // The result is read from 32-bit element 2 of the vector.
              SetIntOrZR(context, op.Rd, context.VectorExtract(OperandType.I32, tmp, 2));
          }

          /// <summary>
          /// Emits the PCLMULQDQ-based sequence for the 64-bit CRC32 variants and writes the 32-bit
          /// result to Rd.
          /// </summary>
          /// <param name="context">Emitter context; <c>CurrOp</c> must be an <c>OpCodeAluBinary</c>.</param>
          /// <param name="castagnoli">Selects the CRC32C constants when true, the CRC32 constants when false.</param>
          private static void EmitCrc32Optimized64(ArmEmitterContext context, bool castagnoli)
          {
              OpCodeAluBinary op = (OpCodeAluBinary)context.CurrOp;

              long mu = castagnoli ? Crc32cMu : Crc32Mu;
              long polynomial = castagnoli ? Crc32cPolynomial : Crc32Polynomial;

              Operand crc = GetIntOrZR(context, op.Rn);
              Operand data = GetIntOrZR(context, op.Rm);

              // Move both inputs into element 0 of otherwise zeroed vectors.
              crc = context.VectorInsert(context.VectorZero(), crc, 0);
              data = context.VectorInsert(context.VectorZero(), data, 0);

              // First pass: XOR the inputs, byte-shift the whole vector left by 4 bytes, multiply
              // by mu and the polynomial, then XOR the shifted input back in.
              Operand tmp = context.AddIntrinsic(Intrinsic.X86Pxor, crc, data);
              Operand res = context.AddIntrinsic(Intrinsic.X86Pslldq, tmp, Const(4));

              tmp = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, res, X86GetScalar(context, mu), Const(0));
              tmp = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, tmp, X86GetScalar(context, polynomial), Const(0));

              tmp = context.AddIntrinsic(Intrinsic.X86Pxor, tmp, res);
              tmp = context.AddIntrinsic(Intrinsic.X86Psllq, tmp, Const(32));

              // Second pass. NOTE(review): the immediate 1 on the first multiply presumably selects
              // the upper quadword of tmp - confirm against the PCLMULQDQ immediate encoding.
              tmp = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, tmp, X86GetScalar(context, mu), Const(1));
              tmp = context.AddIntrinsic(Intrinsic.X86Pclmulqdq, tmp, X86GetScalar(context, polynomial), Const(0));

              // The result is read from 32-bit element 2 of the vector.
              SetIntOrZR(context, op.Rd, context.VectorExtract(OperandType.I32, tmp, 2));
          }

          /// <summary>
          /// Emits a call to the <c>SoftFallback</c> method called <paramref name="name"/>, passing the
          /// Rn and Rm operands, and stores the returned value in Rd.
          /// </summary>
          /// <param name="context">Emitter context; <c>CurrOp</c> must be an <c>OpCodeAluBinary</c>.</param>
          /// <param name="name">Method name looked up on <c>SoftFallback</c> via reflection.</param>
          private static void EmitCrc32Call(ArmEmitterContext context, string name)
          {
              OpCodeAluBinary op = (OpCodeAluBinary)context.CurrOp;

              Operand n = GetIntOrZR(context, op.Rn);
              Operand m = GetIntOrZR(context, op.Rm);

              Operand d = context.Call(typeof(SoftFallback).GetMethod(name), n, m);

              SetIntOrZR(context, op.Rd, d);
          }
      }
  }