RegisterUsage.cs 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416
  1. using ARMeilleure.IntermediateRepresentation;
  2. using ARMeilleure.State;
  3. using System;
  4. using static ARMeilleure.IntermediateRepresentation.OperandHelper;
  5. using static ARMeilleure.IntermediateRepresentation.OperationHelper;
  6. namespace ARMeilleure.Translation
  7. {
  8. static class RegisterUsage
  9. {
  // Layout shared by every 64-bit mask in this pass (see GetMask): bits [0, RegsCount)
  // address base registers by index, bits [RegsCount, 2 * RegsCount) address the flag
  // with the same index. RegsMask folds a mask bit back to a register/flag index.
  private const int RegsCount = 32;
  private const int RegsMask = RegsCount - 1;

  // Integer-side bits removed by ClearCallerSavedIntRegs: bits 9-15 (integer registers
  // 9-15) and bits 60-63 (flags 28-31).
  // NOTE(review): presumably the AArch64 temporaries x9-x15 and the NZCV flags - confirm.
  private const long CallerSavedIntRegistersMask = 0x7fL << 9;
  private const long PStateNzcvFlagsMask = 0xfL << 60;

  // Vector-side bits removed by ClearCallerSavedVecRegs: bits 16-31 (vector registers
  // 16-31) and bits 60-63 (FP flags 28-31).
  // NOTE(review): presumably v16-v31 and the FP NZCV flags - confirm.
  private const long CallerSavedVecRegistersMask = 0xffffL << 16;
  private const long FpStateNzcvFlagsMask = 0xfL << 60;
  /// <summary>
  /// Immutable pair of 64-bit sets: one for the integer side and one for the vector side.
  /// GetMask places base registers in the low 32 bits and the matching flags in the
  /// high 32 bits of each set.
  /// </summary>
  /// <remarks>
  /// The type is a readonly struct: every operator returns a new value, and nothing in
  /// this class mutates a mask in place, so exposing setters only invited accidental
  /// writes to copies.
  /// </remarks>
  private readonly struct RegisterMask : IEquatable<RegisterMask>
  {
      /// <summary>Bit set for integer registers and their flags.</summary>
      public long IntMask { get; }

      /// <summary>Bit set for vector registers and their flags.</summary>
      public long VecMask { get; }

      public RegisterMask(long intMask, long vecMask)
      {
          IntMask = intMask;
          VecMask = vecMask;
      }

      /// <summary>Component-wise intersection of both sets.</summary>
      public static RegisterMask operator &(RegisterMask x, RegisterMask y)
      {
          return new RegisterMask(x.IntMask & y.IntMask, x.VecMask & y.VecMask);
      }

      /// <summary>Component-wise union of both sets.</summary>
      public static RegisterMask operator |(RegisterMask x, RegisterMask y)
      {
          return new RegisterMask(x.IntMask | y.IntMask, x.VecMask | y.VecMask);
      }

      /// <summary>Component-wise complement of both sets.</summary>
      public static RegisterMask operator ~(RegisterMask x)
      {
          return new RegisterMask(~x.IntMask, ~x.VecMask);
      }

      public static bool operator ==(RegisterMask x, RegisterMask y)
      {
          return x.Equals(y);
      }

      public static bool operator !=(RegisterMask x, RegisterMask y)
      {
          return !x.Equals(y);
      }

      public override bool Equals(object obj)
      {
          return obj is RegisterMask regMask && Equals(regMask);
      }

      /// <summary>Two masks are equal when both of their sets are bit-for-bit equal.</summary>
      public bool Equals(RegisterMask other)
      {
          return IntMask == other.IntMask && VecMask == other.VecMask;
      }

      public override int GetHashCode()
      {
          return HashCode.Combine(IntMask, VecMask);
      }
  }
  /// <summary>
  /// Determines which registers every basic block reads and writes, propagates that
  /// information across the control flow graph until it no longer changes, and then
  /// inserts the loads and stores that move those registers between the operations of
  /// the function and memory addressed relative to argument 0.
  /// </summary>
  /// <param name="cfg">Control flow graph to analyse and rewrite in place.</param>
  /// <param name="mode">Execution mode; selects the operand type of integer registers.</param>
  /// <param name="isCompleteFunction">
  /// Forwarded to the store emission; together with
  /// <c>Optimizations.AssumeStrictAbiCompliance</c> it causes the caller saved register
  /// bits to be dropped from the stores.
  /// </param>
  /// <exception cref="InvalidCastException">
  /// A block contains a node that is not an <c>Operation</c>.
  /// </exception>
  public static void RunPass(ControlFlowGraph cfg, ExecutionMode mode, bool isCompleteFunction)
  {
      // Compute local register inputs and outputs used inside blocks.
      // An input is a register read before the block itself has written it;
      // an output is any register the block writes.
      RegisterMask[] localInputs = new RegisterMask[cfg.Blocks.Count];
      RegisterMask[] localOutputs = new RegisterMask[cfg.Blocks.Count];

      for (BasicBlock block = cfg.Blocks.First; block != null; block = block.ListNext)
      {
          for (Node node = block.Operations.First; node != null; node = node.ListNext)
          {
              // Direct cast instead of "as": a node of any other type now fails right
              // here with an InvalidCastException rather than with a
              // NullReferenceException on the first member access below.
              Operation operation = (Operation)node;

              for (int srcIndex = 0; srcIndex < operation.SourcesCount; srcIndex++)
              {
                  Operand source = operation.GetSource(srcIndex);

                  if (source.Kind != OperandKind.Register)
                  {
                      continue;
                  }

                  Register register = source.GetRegister();

                  // Reads of a register the block already wrote are satisfied locally.
                  localInputs[block.Index] |= GetMask(register) & ~localOutputs[block.Index];
              }

              if (operation.Destination != null && operation.Destination.Kind == OperandKind.Register)
              {
                  localOutputs[block.Index] |= GetMask(operation.Destination.GetRegister());
              }
          }
      }

      // Compute global register inputs and outputs used across blocks.
      // globalCmnOutputs holds the registers written on every path reaching a block,
      // globalOutputs the registers written on at least one path (including the block).
      RegisterMask[] globalCmnOutputs = new RegisterMask[cfg.Blocks.Count];
      RegisterMask[] globalInputs = new RegisterMask[cfg.Blocks.Count];
      RegisterMask[] globalOutputs = new RegisterMask[cfg.Blocks.Count];

      bool modified;
      bool firstPass = true;

      // Iterate both propagation directions until no mask changes any more.
      do
      {
          modified = false;

          // Compute register outputs (walks the post order array backwards).
          for (int index = cfg.PostOrderBlocks.Length - 1; index >= 0; index--)
          {
              BasicBlock block = cfg.PostOrderBlocks[index];

              if (block.Predecessors.Count != 0 && !HasContextLoad(block))
              {
                  BasicBlock predecessor = block.Predecessors[0];

                  RegisterMask cmnOutputs = localOutputs[predecessor.Index] | globalCmnOutputs[predecessor.Index];
                  RegisterMask outputs = globalOutputs[predecessor.Index];

                  // Intersect the "always written" sets and unite the "maybe written"
                  // sets of all predecessors.
                  for (int pIndex = 1; pIndex < block.Predecessors.Count; pIndex++)
                  {
                      predecessor = block.Predecessors[pIndex];

                      cmnOutputs &= localOutputs[predecessor.Index] | globalCmnOutputs[predecessor.Index];
                      outputs |= globalOutputs[predecessor.Index];
                  }

                  // Registers written on some incoming paths but not on all of them
                  // are treated as inputs of this block.
                  globalInputs[block.Index] |= outputs & ~cmnOutputs;

                  // After the first pass the common set may only shrink.
                  if (!firstPass)
                  {
                      cmnOutputs &= globalCmnOutputs[block.Index];
                  }

                  if (Exchange(globalCmnOutputs, block.Index, cmnOutputs))
                  {
                      modified = true;
                  }

                  outputs |= localOutputs[block.Index];

                  if (Exchange(globalOutputs, block.Index, globalOutputs[block.Index] | outputs))
                  {
                      modified = true;
                  }
              }
              else if (Exchange(globalOutputs, block.Index, localOutputs[block.Index]))
              {
                  // No predecessors, or the block starts with a context load: only its
                  // own writes count as outputs.
                  modified = true;
              }
          }

          // Compute register inputs (walks the post order array forwards).
          for (int index = 0; index < cfg.PostOrderBlocks.Length; index++)
          {
              BasicBlock block = cfg.PostOrderBlocks[index];

              RegisterMask inputs = localInputs[block.Index];

              for (int i = 0; i < block.SuccessorCount; i++)
              {
                  inputs |= globalInputs[block.GetSuccessor(i).Index];
              }

              // Registers written on every path into this block need no load here.
              inputs &= ~globalCmnOutputs[block.Index];

              if (Exchange(globalInputs, block.Index, globalInputs[block.Index] | inputs))
              {
                  modified = true;
              }
          }

          firstPass = false;
      }
      while (modified);

      // Insert load and store context instructions where needed.
      for (BasicBlock block = cfg.Blocks.First; block != null; block = block.ListNext)
      {
          bool hasContextLoad = HasContextLoad(block);

          // The source-less LoadFromContext only marks the spot; drop it before the
          // real loads are put in front of the block.
          if (hasContextLoad)
          {
              block.Operations.Remove(block.Operations.First);
          }

          // The only block without any predecessor should be the entry block.
          // It always needs a context load as it is the first block to run.
          if (block.Predecessors.Count == 0 || hasContextLoad)
          {
              // LoadLocals prepends, so the integer loads emitted second end up first.
              LoadLocals(block, globalInputs[block.Index].VecMask, RegisterType.Vector, mode);
              LoadLocals(block, globalInputs[block.Index].IntMask, RegisterType.Integer, mode);
          }

          bool hasContextStore = HasContextStore(block);

          // Same for the source-less StoreToContext marker at the end of the block.
          if (hasContextStore)
          {
              block.Operations.Remove(block.Operations.Last);
          }

          if (EndsWithReturn(block) || hasContextStore)
          {
              StoreLocals(block, globalOutputs[block.Index].IntMask, RegisterType.Integer, mode, isCompleteFunction);
              StoreLocals(block, globalOutputs[block.Index].VecMask, RegisterType.Vector, mode, isCompleteFunction);
          }
      }
  }
  /// <summary>
  /// Tells whether the first operation of <paramref name="block"/> is a
  /// <c>LoadFromContext</c> that has no sources.
  /// </summary>
  private static bool HasContextLoad(BasicBlock block)
  {
      if (!StartsWith(block, Instruction.LoadFromContext))
      {
          return false;
      }

      return block.Operations.First.SourcesCount == 0;
  }
  /// <summary>
  /// Tells whether the last operation of <paramref name="block"/> is a
  /// <c>StoreToContext</c> that has no sources.
  /// </summary>
  private static bool HasContextStore(BasicBlock block)
  {
      if (!EndsWith(block, Instruction.StoreToContext))
      {
          return false;
      }

      return block.GetLastOp().SourcesCount == 0;
  }
  /// <summary>
  /// Tells whether <paramref name="block"/> is non-empty and its first node is an
  /// <c>Operation</c> whose instruction equals <paramref name="inst"/>.
  /// </summary>
  private static bool StartsWith(BasicBlock block, Instruction inst)
  {
      // Short-circuit keeps the empty-block case from touching Operations.First.
      return block.Operations.Count != 0
          && block.Operations.First is Operation firstOperation
          && firstOperation.Instruction == inst;
  }
  /// <summary>
  /// Tells whether <paramref name="block"/> is non-empty and its last node is an
  /// <c>Operation</c> whose instruction equals <paramref name="inst"/>.
  /// </summary>
  private static bool EndsWith(BasicBlock block, Instruction inst)
  {
      // Short-circuit keeps the empty-block case from touching Operations.Last.
      return block.Operations.Count != 0
          && block.Operations.Last is Operation lastOperation
          && lastOperation.Instruction == inst;
  }
  /// <summary>
  /// Builds the single-bit mask that identifies <paramref name="register"/>.
  /// Integer and vector registers use bit <c>Index</c> of their respective set;
  /// flags and FP flags use bit <c>RegsCount + Index</c> of the integer and vector
  /// set respectively. Any other register type yields an empty mask.
  /// </summary>
  private static RegisterMask GetMask(Register register)
  {
      switch (register.Type)
      {
          case RegisterType.Integer:
              return new RegisterMask(1L << register.Index, 0);

          case RegisterType.Flag:
              return new RegisterMask((1L << RegsCount) << register.Index, 0);

          case RegisterType.Vector:
              return new RegisterMask(0, 1L << register.Index);

          case RegisterType.FpFlag:
              return new RegisterMask(0, (1L << RegsCount) << register.Index);

          default:
              return new RegisterMask(0, 0);
      }
  }
  /// <summary>
  /// Stores <paramref name="value"/> at <paramref name="blkIndex"/> in
  /// <paramref name="masks"/>.
  /// </summary>
  /// <returns>True when the stored value differs from the one it replaced.</returns>
  private static bool Exchange(RegisterMask[] masks, int blkIndex, RegisterMask value)
  {
      bool changed = masks[blkIndex] != value;

      masks[blkIndex] = value;

      return changed;
  }
  /// <summary>
  /// Prepends to <paramref name="block"/> one address computation and one load for every
  /// bit set in <paramref name="inputs"/>, preceded by a single <c>LoadArgument</c> of
  /// argument 0 that serves as the base address.
  /// </summary>
  /// <param name="block">Block that receives the operations at its start.</param>
  /// <param name="inputs">Bit set of registers (low 32 bits) and flags (high 32 bits) to load.</param>
  /// <param name="baseType">Register type the low 32 bits refer to.</param>
  /// <param name="mode">Execution mode; selects the operand type of integer registers.</param>
  private static void LoadLocals(BasicBlock block, long inputs, RegisterType baseType, ExecutionMode mode)
  {
      // Nothing to load: do not emit a LoadArgument whose result nobody would read.
      if (inputs == 0)
      {
          return;
      }

      // NOTE(review): argument 0 is presumably the native context pointer - confirm.
      Operand arg0 = Local(OperandType.I64);

      // Everything is inserted at the front, so walking the bits from high to low
      // leaves the loads in ascending bit order.
      for (int bit = 63; bit >= 0; bit--)
      {
          long mask = 1L << bit;

          if ((inputs & mask) == 0)
          {
              continue;
          }

          Operand dest = GetRegFromBit(bit, baseType, mode);

          long offset = NativeContext.GetRegisterOffset(dest.GetRegister());

          Operand addr = Local(OperandType.I64);

          // The load is added first and the address computation second, which puts
          // the address computation in front of the load that consumes it.
          Operation loadOp = Operation(Instruction.Load, dest, addr);

          block.Operations.AddFirst(loadOp);

          Operation calcOffsOp = Operation(Instruction.Add, addr, arg0, Const(offset));

          block.Operations.AddFirst(calcOffsOp);
      }

      // Added last so that it precedes every address computation above.
      Operation loadArg0 = Operation(Instruction.LoadArgument, arg0, Const(0));

      block.Operations.AddFirst(loadArg0);
  }
  /// <summary>
  /// Appends to <paramref name="block"/> a <c>LoadArgument</c> of argument 0 followed by
  /// one address computation and one store for every bit set in
  /// <paramref name="outputs"/>.
  /// </summary>
  /// <param name="block">Block that receives the operations.</param>
  /// <param name="outputs">Bit set of registers (low 32 bits) and flags (high 32 bits) to store.</param>
  /// <param name="baseType">Register type the low 32 bits refer to.</param>
  /// <param name="mode">Execution mode; selects the operand type of integer registers.</param>
  /// <param name="isCompleteFunction">
  /// When set together with <c>Optimizations.AssumeStrictAbiCompliance</c>, the caller
  /// saved register bits are removed from <paramref name="outputs"/> before storing.
  /// </param>
  private static void StoreLocals(BasicBlock block, long outputs, RegisterType baseType, ExecutionMode mode, bool isCompleteFunction)
  {
      if (Optimizations.AssumeStrictAbiCompliance && isCompleteFunction)
      {
          if (baseType == RegisterType.Integer || baseType == RegisterType.Flag)
          {
              outputs = ClearCallerSavedIntRegs(outputs);
          }
          else /* if (baseType == RegisterType.Vector || baseType == RegisterType.FpFlag) */
          {
              outputs = ClearCallerSavedVecRegs(outputs);
          }
      }

      // Checked after the filtering above: when nothing is left to store, do not emit
      // a LoadArgument whose result nobody would read.
      if (outputs == 0)
      {
          return;
      }

      // NOTE(review): argument 0 is presumably the native context pointer - confirm.
      Operand arg0 = Local(OperandType.I64);

      Operation loadArg0 = Operation(Instruction.LoadArgument, arg0, Const(0));

      block.Append(loadArg0);

      for (int bit = 0; bit < 64; bit++)
      {
          long mask = 1L << bit;

          if ((outputs & mask) == 0)
          {
              continue;
          }

          Operand source = GetRegFromBit(bit, baseType, mode);

          long offset = NativeContext.GetRegisterOffset(source.GetRegister());

          Operand addr = Local(OperandType.I64);

          Operation calcOffsOp = Operation(Instruction.Add, addr, arg0, Const(offset));

          block.Append(calcOffsOp);

          // Store has no destination operand, hence the null.
          Operation storeOp = Operation(Instruction.Store, null, addr, source);

          block.Append(storeOp);
      }
  }
  /// <summary>
  /// Maps a mask bit back to a register operand. Bits below <c>RegsCount</c> name a
  /// register of <paramref name="baseType"/>; higher bits name the flag (for an integer
  /// base type) or the FP flag (for a vector base type) with index
  /// <c>bit &amp; RegsMask</c>.
  /// </summary>
  /// <exception cref="ArgumentOutOfRangeException">
  /// <paramref name="bit"/> is at least <c>RegsCount</c> and
  /// <paramref name="baseType"/> is neither integer nor vector.
  /// </exception>
  private static Operand GetRegFromBit(int bit, RegisterType baseType, ExecutionMode mode)
  {
      if (bit < RegsCount)
      {
          return OperandHelper.Register(bit, baseType, GetOperandType(baseType, mode));
      }

      int flagIndex = bit & RegsMask;

      switch (baseType)
      {
          case RegisterType.Integer:
              return OperandHelper.Register(flagIndex, RegisterType.Flag, OperandType.I32);

          case RegisterType.Vector:
              return OperandHelper.Register(flagIndex, RegisterType.FpFlag, OperandType.I32);

          default:
              throw new ArgumentOutOfRangeException(nameof(bit));
      }
  }
  /// <summary>
  /// Returns the operand type used for a register of the given type: I32 for both flag
  /// kinds, V128 for vectors, and I64 or I32 for integers depending on whether
  /// <paramref name="mode"/> is <c>Aarch64</c>.
  /// </summary>
  /// <exception cref="ArgumentException"><paramref name="type"/> is none of the above.</exception>
  private static OperandType GetOperandType(RegisterType type, ExecutionMode mode)
  {
      if (type == RegisterType.Flag || type == RegisterType.FpFlag)
      {
          return OperandType.I32;
      }

      if (type == RegisterType.Integer)
      {
          if (mode == ExecutionMode.Aarch64)
          {
              return OperandType.I64;
          }

          return OperandType.I32;
      }

      if (type == RegisterType.Vector)
      {
          return OperandType.V128;
      }

      throw new ArgumentException($"Invalid register type \"{type}\".");
  }
  /// <summary>
  /// Tells whether the last operation of <paramref name="block"/> is an
  /// <c>Operation</c> whose instruction is <c>Return</c>.
  /// </summary>
  private static bool EndsWithReturn(BasicBlock block)
  {
      return block.GetLastOp() is Operation lastOperation
          && lastOperation.Instruction == Instruction.Return;
  }
  /// <summary>
  /// Returns <paramref name="mask"/> with the bits of
  /// <c>CallerSavedIntRegistersMask</c> and <c>PStateNzcvFlagsMask</c> cleared.
  /// </summary>
  private static long ClearCallerSavedIntRegs(long mask)
  {
      // TODO: ARM32 support.
      const long ClearedBits = CallerSavedIntRegistersMask | PStateNzcvFlagsMask;

      return mask & ~ClearedBits;
  }
  /// <summary>
  /// Returns <paramref name="mask"/> with the bits of
  /// <c>CallerSavedVecRegistersMask</c> and <c>FpStateNzcvFlagsMask</c> cleared.
  /// </summary>
  private static long ClearCallerSavedVecRegs(long mask)
  {
      // TODO: ARM32 support.
      const long ClearedBits = CallerSavedVecRegistersMask | FpStateNzcvFlagsMask;

      return mask & ~ClearedBits;
  }
  319. }
  320. }