// RegisterUsage.cs (14 KB)
  1. using ARMeilleure.IntermediateRepresentation;
  2. using ARMeilleure.State;
  3. using System;
  4. using System.Numerics;
  5. using System.Runtime.Intrinsics;
  6. using System.Runtime.Intrinsics.X86;
  7. using static ARMeilleure.IntermediateRepresentation.Operand.Factory;
  8. using static ARMeilleure.IntermediateRepresentation.Operation.Factory;
  9. namespace ARMeilleure.Translation
  10. {
  11. static class RegisterUsage
  12. {
  // Number of register slots per register class inside a 64-bit mask. GetMask places
  // Integer/Vector registers at bit positions [0, RegsCount) and Flag/FpFlag registers
  // at positions shifted left by RegsCount.
  private const int RegsCount = 32;
  // Used by GetRegFromBit to turn a bit position at or above RegsCount back into a flag index.
  private const int RegsMask = RegsCount - 1;
  /// <summary>
  /// Two 64-bit register bit sets packed into one 128-bit vector: element 0 is the
  /// integer mask and element 1 is the vector mask. Bitwise operators use SSE2 when it
  /// is available and fall back to per-element scalar operations otherwise.
  /// </summary>
  private readonly struct RegisterMask : IEquatable<RegisterMask>
  {
      /// <summary>Both masks as a single vector (element 0 = integer, element 1 = vector).</summary>
      public Vector128<long> Mask { get; }

      /// <summary>Element 0 of <see cref="Mask"/>.</summary>
      public long IntMask => Mask.GetElement(0);

      /// <summary>Element 1 of <see cref="Mask"/>.</summary>
      public long VecMask => Mask.GetElement(1);

      /// <summary>Wraps an already packed vector.</summary>
      public RegisterMask(Vector128<long> mask) => Mask = mask;

      /// <summary>Packs the two scalar masks into a vector.</summary>
      public RegisterMask(long intMask, long vecMask) => Mask = Vector128.Create(intMask, vecMask);

      /// <summary>Bitwise AND of both masks.</summary>
      public static RegisterMask operator &(RegisterMask x, RegisterMask y)
      {
          return Sse2.IsSupported
              ? new RegisterMask(Sse2.And(x.Mask, y.Mask))
              : new RegisterMask(x.IntMask & y.IntMask, x.VecMask & y.VecMask);
      }

      /// <summary>Bitwise OR of both masks.</summary>
      public static RegisterMask operator |(RegisterMask x, RegisterMask y)
      {
          return Sse2.IsSupported
              ? new RegisterMask(Sse2.Or(x.Mask, y.Mask))
              : new RegisterMask(x.IntMask | y.IntMask, x.VecMask | y.VecMask);
      }

      /// <summary>Bitwise complement of both masks.</summary>
      public static RegisterMask operator ~(RegisterMask x)
      {
          // AndNot computes (~first) & second, so an all-ones second operand yields ~first.
          return Sse2.IsSupported
              ? new RegisterMask(Sse2.AndNot(x.Mask, Vector128<long>.AllBitsSet))
              : new RegisterMask(~x.IntMask, ~x.VecMask);
      }

      public static bool operator ==(RegisterMask x, RegisterMask y) => x.Equals(y);

      public static bool operator !=(RegisterMask x, RegisterMask y) => !x.Equals(y);

      public override bool Equals(object obj)
      {
          if (obj is RegisterMask boxed)
          {
              return Equals(boxed);
          }

          return false;
      }

      public bool Equals(RegisterMask other) => Mask.Equals(other.Mask);

      public override int GetHashCode() => Mask.GetHashCode();
  }
  /// <summary>
  /// Analyzes which registers each block reads and writes, propagates that information
  /// across the control flow graph until nothing changes, and then inserts the context
  /// loads and stores that the blocks require.
  /// </summary>
  /// <param name="cfg">Control flow graph to analyze; its blocks are modified in place.</param>
  /// <param name="mode">Execution mode, forwarded to the load/store emitters to pick register operand types.</param>
  public static void RunPass(ControlFlowGraph cfg, ExecutionMode mode)
  {
      ComputeLocalUsage(cfg, out RegisterMask[] localInputs, out RegisterMask[] localOutputs);

      ComputeGlobalUsage(
          cfg,
          localInputs,
          localOutputs,
          out RegisterMask[] globalInputs,
          out RegisterMask[] globalOutputs);

      InsertContextAccesses(cfg, mode, globalInputs, globalOutputs);
  }

  // Computes, per block, the registers read before being written in that block (inputs)
  // and the registers written in that block (outputs). Arrays are indexed by block.Index.
  private static void ComputeLocalUsage(
      ControlFlowGraph cfg,
      out RegisterMask[] localInputs,
      out RegisterMask[] localOutputs)
  {
      localInputs = new RegisterMask[cfg.Blocks.Count];
      localOutputs = new RegisterMask[cfg.Blocks.Count];

      for (BasicBlock block = cfg.Blocks.First; block != null; block = block.ListNext)
      {
          for (Operation node = block.Operations.First; node != default; node = node.ListNext)
          {
              for (int index = 0; index < node.SourcesCount; index++)
              {
                  Operand source = node.GetSource(index);

                  if (source.Kind == OperandKind.Register)
                  {
                      Register register = source.GetRegister();

                      // A read only counts as a block input if the block has not written the register yet.
                      localInputs[block.Index] |= GetMask(register) & ~localOutputs[block.Index];
                  }
              }

              if (node.Destination != default && node.Destination.Kind == OperandKind.Register)
              {
                  localOutputs[block.Index] |= GetMask(node.Destination.GetRegister());
              }
          }
      }
  }

  // Propagates register usage across blocks until a fixed point is reached. Outputs flow
  // forward (reverse post order), inputs flow backward (post order).
  private static void ComputeGlobalUsage(
      ControlFlowGraph cfg,
      RegisterMask[] localInputs,
      RegisterMask[] localOutputs,
      out RegisterMask[] globalInputs,
      out RegisterMask[] globalOutputs)
  {
      // Registers written by every predecessor path (intersection over predecessors).
      RegisterMask[] globalCmnOutputs = new RegisterMask[cfg.Blocks.Count];

      globalInputs = new RegisterMask[cfg.Blocks.Count];
      globalOutputs = new RegisterMask[cfg.Blocks.Count];

      bool modified;
      bool firstPass = true;

      do
      {
          modified = false;

          // Compute register outputs.
          for (int index = cfg.PostOrderBlocks.Length - 1; index >= 0; index--)
          {
              BasicBlock block = cfg.PostOrderBlocks[index];

              if (block.Predecessors.Count != 0 && !HasContextLoad(block))
              {
                  BasicBlock predecessor = block.Predecessors[0];

                  RegisterMask cmnOutputs = localOutputs[predecessor.Index] | globalCmnOutputs[predecessor.Index];
                  RegisterMask outputs = globalOutputs[predecessor.Index];

                  for (int pIndex = 1; pIndex < block.Predecessors.Count; pIndex++)
                  {
                      predecessor = block.Predecessors[pIndex];

                      cmnOutputs &= localOutputs[predecessor.Index] | globalCmnOutputs[predecessor.Index];
                      outputs |= globalOutputs[predecessor.Index];
                  }

                  // Registers written by some, but not all, predecessors become inputs of this block.
                  globalInputs[block.Index] |= outputs & ~cmnOutputs;

                  // After the first pass the common set may only shrink relative to the stored value.
                  if (!firstPass)
                  {
                      cmnOutputs &= globalCmnOutputs[block.Index];
                  }

                  modified |= Exchange(globalCmnOutputs, block.Index, cmnOutputs);

                  outputs |= localOutputs[block.Index];

                  modified |= Exchange(globalOutputs, block.Index, globalOutputs[block.Index] | outputs);
              }
              else
              {
                  // No predecessors, or the block starts with a context load: only its own writes count.
                  modified |= Exchange(globalOutputs, block.Index, localOutputs[block.Index]);
              }
          }

          // Compute register inputs.
          for (int index = 0; index < cfg.PostOrderBlocks.Length; index++)
          {
              BasicBlock block = cfg.PostOrderBlocks[index];

              RegisterMask inputs = localInputs[block.Index];

              for (int i = 0; i < block.SuccessorsCount; i++)
              {
                  inputs |= globalInputs[block.GetSuccessor(i).Index];
              }

              inputs &= ~globalCmnOutputs[block.Index];

              modified |= Exchange(globalInputs, block.Index, globalInputs[block.Index] | inputs);
          }

          firstPass = false;
      }
      while (modified);
  }

  // Replaces the LoadFromContext/StoreToContext markers with explicit loads and stores of
  // the registers in the computed global input/output masks.
  private static void InsertContextAccesses(
      ControlFlowGraph cfg,
      ExecutionMode mode,
      RegisterMask[] globalInputs,
      RegisterMask[] globalOutputs)
  {
      for (BasicBlock block = cfg.Blocks.First; block != null; block = block.ListNext)
      {
          bool hasContextLoad = HasContextLoad(block);

          if (hasContextLoad)
          {
              block.Operations.Remove(block.Operations.First);
          }

          Operand arg = default;

          // The only block without any predecessor should be the entry block.
          // It always needs a context load as it is the first block to run.
          if (block.Predecessors.Count == 0 || hasContextLoad)
          {
              long vecMask = globalInputs[block.Index].VecMask;
              long intMask = globalInputs[block.Index].IntMask;

              if (vecMask != 0 || intMask != 0)
              {
                  arg = Local(OperandType.I64);

                  Operation loadArg = block.Operations.AddFirst(Operation(Instruction.LoadArgument, arg, Const(0)));

                  LoadLocals(block, vecMask, RegisterType.Vector, mode, loadArg, arg);
                  LoadLocals(block, intMask, RegisterType.Integer, mode, loadArg, arg);
              }
          }

          bool hasContextStore = HasContextStore(block);

          if (hasContextStore)
          {
              block.Operations.Remove(block.Operations.Last);
          }

          if (EndsWithReturn(block) || hasContextStore)
          {
              long vecMask = globalOutputs[block.Index].VecMask;
              long intMask = globalOutputs[block.Index].IntMask;

              if (vecMask != 0 || intMask != 0)
              {
                  // Reuse the argument loaded for the context load above when there is one.
                  if (arg == default)
                  {
                      arg = Local(OperandType.I64);

                      block.Append(Operation(Instruction.LoadArgument, arg, Const(0)));
                  }

                  StoreLocals(block, intMask, RegisterType.Integer, mode, arg);
                  StoreLocals(block, vecMask, RegisterType.Vector, mode, arg);
              }
          }
      }
  }
  // True when the block's first operation is a LoadFromContext with no sources.
  private static bool HasContextLoad(BasicBlock block)
  {
      if (!StartsWith(block, Instruction.LoadFromContext))
      {
          return false;
      }

      return block.Operations.First.SourcesCount == 0;
  }
  // True when the block's last operation is a StoreToContext with no sources.
  private static bool HasContextStore(BasicBlock block)
  {
      if (!EndsWith(block, Instruction.StoreToContext))
      {
          return false;
      }

      return block.Operations.Last.SourcesCount == 0;
  }
  // True when the block has at least one operation and the first one is `inst`.
  private static bool StartsWith(BasicBlock block, Instruction inst)
  {
      if (block.Operations.Count <= 0)
      {
          return false;
      }

      Operation head = block.Operations.First;

      if (head == default)
      {
          return false;
      }

      return head.Instruction == inst;
  }
  // True when the block has at least one operation and the last one is `inst`.
  private static bool EndsWith(BasicBlock block, Instruction inst)
  {
      if (block.Operations.Count <= 0)
      {
          return false;
      }

      Operation tail = block.Operations.Last;

      if (tail == default)
      {
          return false;
      }

      return tail.Instruction == inst;
  }
  // Builds the single-bit mask for a register. Integer and Flag registers go in the
  // integer mask, Vector and FpFlag registers in the vector mask; flag bits are placed
  // RegsCount positions above the register index. Any other register type gives an empty mask.
  private static RegisterMask GetMask(Register register)
  {
      switch (register.Type)
      {
          case RegisterType.Integer:
              return new RegisterMask(1L << register.Index, 0L);

          case RegisterType.Flag:
              return new RegisterMask((1L << RegsCount) << register.Index, 0L);

          case RegisterType.Vector:
              return new RegisterMask(0L, 1L << register.Index);

          case RegisterType.FpFlag:
              return new RegisterMask(0L, (1L << RegsCount) << register.Index);

          default:
              return new RegisterMask(0L, 0L);
      }
  }
  // Stores `value` at masks[blkIndex] and reports whether it differed from the previous entry.
  private static bool Exchange(RegisterMask[] masks, int blkIndex, RegisterMask value)
  {
      bool differs = masks[blkIndex] != value;

      masks[blkIndex] = value;

      return differs;
  }
  // Emits, for every bit set in `inputs`, an address computation (arg + register offset)
  // followed by a load into the matching register. Bits are visited from highest to lowest
  // and each pair is inserted right after `loadArg`.
  private static void LoadLocals(
      BasicBlock block,
      long inputs,
      RegisterType baseType,
      ExecutionMode mode,
      Operation loadArg,
      Operand arg)
  {
      long pending = inputs;

      while (pending != 0)
      {
          // Index of the highest set bit (pending is non-zero here).
          int highest = BitOperations.Log2((ulong)pending);

          Operand target = GetRegFromBit(highest, baseType, mode);
          Operand displacement = Const((long)NativeContext.GetRegisterOffset(target.GetRegister()));
          Operand address = Local(OperandType.I64);

          // The Load is inserted first and the Add second, both after loadArg, so the Add
          // lands ahead of the Load (assuming AddAfter inserts immediately after the node).
          Operation load = Operation(Instruction.Load, target, address);
          block.Operations.AddAfter(loadArg, load);

          Operation computeAddress = Operation(Instruction.Add, address, arg, displacement);
          block.Operations.AddAfter(loadArg, computeAddress);

          // The bit is known to be set, so XOR clears it.
          pending ^= 1L << highest;
      }
  }
  // Appends, for every bit set in `outputs`, an address computation (arg + register offset)
  // followed by a store of the matching register. Bits are visited from lowest to highest.
  private static void StoreLocals(
      BasicBlock block,
      long outputs,
      RegisterType baseType,
      ExecutionMode mode,
      Operand arg)
  {
      long pending = outputs;

      while (pending != 0)
      {
          int lowest = BitOperations.TrailingZeroCount(pending);

          Operand value = GetRegFromBit(lowest, baseType, mode);
          Operand displacement = Const((long)NativeContext.GetRegisterOffset(value.GetRegister()));
          Operand address = Local(OperandType.I64);

          Operation computeAddress = Operation(Instruction.Add, address, arg, displacement);
          block.Append(computeAddress);

          Operation store = Operation(Instruction.Store, default, address, value);
          block.Append(store);

          // The bit is known to be set, so XOR clears it.
          pending ^= 1L << lowest;
      }
  }
  // Maps a mask bit position back to a register operand. Positions below RegsCount are
  // registers of `baseType`; higher positions are Flag (for Integer) or FpFlag (for Vector)
  // registers. Throws ArgumentOutOfRangeException for a high bit with any other base type.
  private static Operand GetRegFromBit(int bit, RegisterType baseType, ExecutionMode mode)
  {
      if (bit < RegsCount)
      {
          return Register(bit, baseType, GetOperandType(baseType, mode));
      }

      switch (baseType)
      {
          case RegisterType.Integer:
              return Register(bit & RegsMask, RegisterType.Flag, OperandType.I32);

          case RegisterType.Vector:
              return Register(bit & RegsMask, RegisterType.FpFlag, OperandType.I32);

          default:
              throw new ArgumentOutOfRangeException(nameof(bit));
      }
  }
  // Operand type used for a register of the given type: I32 for both flag types, V128 for
  // vectors, and I64 or I32 for integers depending on whether the mode is Aarch64.
  // Throws ArgumentException for any other register type.
  private static OperandType GetOperandType(RegisterType type, ExecutionMode mode)
  {
      switch (type)
      {
          case RegisterType.Flag:
          case RegisterType.FpFlag:
              return OperandType.I32;

          case RegisterType.Vector:
              return OperandType.V128;

          case RegisterType.Integer:
              if (mode == ExecutionMode.Aarch64)
              {
                  return OperandType.I64;
              }

              return OperandType.I32;

          default:
              throw new ArgumentException($"Invalid register type \"{type}\".");
      }
  }
  // True when the block's last operation exists and is a Return.
  private static bool EndsWithReturn(BasicBlock block)
  {
      Operation tail = block.Operations.Last;

      if (tail == default)
      {
          return false;
      }

      return tail.Instruction == Instruction.Return;
  }
  313. }
  314. }