RegisterUsage.cs 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420
  1. using ARMeilleure.IntermediateRepresentation;
  2. using ARMeilleure.State;
  3. using System;
  4. using static ARMeilleure.IntermediateRepresentation.OperandHelper;
  5. namespace ARMeilleure.Translation
  6. {
  7. static class RegisterUsage
  8. {
  9. private const long CallerSavedIntRegistersMask = 0x7fL << 9;
  10. private const long PStateNzcvFlagsMask = 0xfL << 60;
  11. private const long FpStateNzcvFlagsMask = 0xfL << 60;
  12. private const long CallerSavedVecRegistersMask = 0xffffL << 16;
  13. private const int RegsCount = 32;
  14. private const int RegsMask = RegsCount - 1;
  15. private struct RegisterMask : IEquatable<RegisterMask>
  16. {
  17. public long IntMask { get; set; }
  18. public long VecMask { get; set; }
  19. public RegisterMask(long intMask, long vecMask)
  20. {
  21. IntMask = intMask;
  22. VecMask = vecMask;
  23. }
  24. public static RegisterMask operator &(RegisterMask x, RegisterMask y)
  25. {
  26. return new RegisterMask(x.IntMask & y.IntMask, x.VecMask & y.VecMask);
  27. }
  28. public static RegisterMask operator |(RegisterMask x, RegisterMask y)
  29. {
  30. return new RegisterMask(x.IntMask | y.IntMask, x.VecMask | y.VecMask);
  31. }
  32. public static RegisterMask operator ~(RegisterMask x)
  33. {
  34. return new RegisterMask(~x.IntMask, ~x.VecMask);
  35. }
  36. public static bool operator ==(RegisterMask x, RegisterMask y)
  37. {
  38. return x.Equals(y);
  39. }
  40. public static bool operator !=(RegisterMask x, RegisterMask y)
  41. {
  42. return !x.Equals(y);
  43. }
  44. public override bool Equals(object obj)
  45. {
  46. return obj is RegisterMask regMask && Equals(regMask);
  47. }
  48. public bool Equals(RegisterMask other)
  49. {
  50. return IntMask == other.IntMask && VecMask == other.VecMask;
  51. }
  52. public override int GetHashCode()
  53. {
  54. return HashCode.Combine(IntMask, VecMask);
  55. }
  56. }
  57. public static void RunPass(ControlFlowGraph cfg, ExecutionMode mode, bool isCompleteFunction)
  58. {
  59. // Compute local register inputs and outputs used inside blocks.
  60. RegisterMask[] localInputs = new RegisterMask[cfg.Blocks.Count];
  61. RegisterMask[] localOutputs = new RegisterMask[cfg.Blocks.Count];
  62. for (BasicBlock block = cfg.Blocks.First; block != null; block = block.ListNext)
  63. {
  64. for (Node node = block.Operations.First; node != null; node = node.ListNext)
  65. {
  66. Operation operation = node as Operation;
  67. for (int srcIndex = 0; srcIndex < operation.SourcesCount; srcIndex++)
  68. {
  69. Operand source = operation.GetSource(srcIndex);
  70. if (source.Kind != OperandKind.Register)
  71. {
  72. continue;
  73. }
  74. Register register = source.GetRegister();
  75. localInputs[block.Index] |= GetMask(register) & ~localOutputs[block.Index];
  76. }
  77. if (operation.Destination != null && operation.Destination.Kind == OperandKind.Register)
  78. {
  79. localOutputs[block.Index] |= GetMask(operation.Destination.GetRegister());
  80. }
  81. }
  82. }
  83. // Compute global register inputs and outputs used across blocks.
  84. RegisterMask[] globalCmnOutputs = new RegisterMask[cfg.Blocks.Count];
  85. RegisterMask[] globalInputs = new RegisterMask[cfg.Blocks.Count];
  86. RegisterMask[] globalOutputs = new RegisterMask[cfg.Blocks.Count];
  87. bool modified;
  88. bool firstPass = true;
  89. do
  90. {
  91. modified = false;
  92. // Compute register outputs.
  93. for (int index = cfg.PostOrderBlocks.Length - 1; index >= 0; index--)
  94. {
  95. BasicBlock block = cfg.PostOrderBlocks[index];
  96. if (block.Predecessors.Count != 0 && !HasContextLoad(block))
  97. {
  98. BasicBlock predecessor = block.Predecessors[0];
  99. RegisterMask cmnOutputs = localOutputs[predecessor.Index] | globalCmnOutputs[predecessor.Index];
  100. RegisterMask outputs = globalOutputs[predecessor.Index];
  101. for (int pIndex = 1; pIndex < block.Predecessors.Count; pIndex++)
  102. {
  103. predecessor = block.Predecessors[pIndex];
  104. cmnOutputs &= localOutputs[predecessor.Index] | globalCmnOutputs[predecessor.Index];
  105. outputs |= globalOutputs[predecessor.Index];
  106. }
  107. globalInputs[block.Index] |= outputs & ~cmnOutputs;
  108. if (!firstPass)
  109. {
  110. cmnOutputs &= globalCmnOutputs[block.Index];
  111. }
  112. if (Exchange(globalCmnOutputs, block.Index, cmnOutputs))
  113. {
  114. modified = true;
  115. }
  116. outputs |= localOutputs[block.Index];
  117. if (Exchange(globalOutputs, block.Index, globalOutputs[block.Index] | outputs))
  118. {
  119. modified = true;
  120. }
  121. }
  122. else if (Exchange(globalOutputs, block.Index, localOutputs[block.Index]))
  123. {
  124. modified = true;
  125. }
  126. }
  127. // Compute register inputs.
  128. for (int index = 0; index < cfg.PostOrderBlocks.Length; index++)
  129. {
  130. BasicBlock block = cfg.PostOrderBlocks[index];
  131. RegisterMask inputs = localInputs[block.Index];
  132. if (block.Next != null)
  133. {
  134. inputs |= globalInputs[block.Next.Index];
  135. }
  136. if (block.Branch != null)
  137. {
  138. inputs |= globalInputs[block.Branch.Index];
  139. }
  140. inputs &= ~globalCmnOutputs[block.Index];
  141. if (Exchange(globalInputs, block.Index, globalInputs[block.Index] | inputs))
  142. {
  143. modified = true;
  144. }
  145. }
  146. firstPass = false;
  147. }
  148. while (modified);
  149. // Insert load and store context instructions where needed.
  150. for (BasicBlock block = cfg.Blocks.First; block != null; block = block.ListNext)
  151. {
  152. bool hasContextLoad = HasContextLoad(block);
  153. if (hasContextLoad)
  154. {
  155. block.Operations.Remove(block.Operations.First);
  156. }
  157. // The only block without any predecessor should be the entry block.
  158. // It always needs a context load as it is the first block to run.
  159. if (block.Predecessors.Count == 0 || hasContextLoad)
  160. {
  161. LoadLocals(block, globalInputs[block.Index].VecMask, RegisterType.Vector, mode);
  162. LoadLocals(block, globalInputs[block.Index].IntMask, RegisterType.Integer, mode);
  163. }
  164. bool hasContextStore = HasContextStore(block);
  165. if (hasContextStore)
  166. {
  167. block.Operations.Remove(block.Operations.Last);
  168. }
  169. if (EndsWithReturn(block) || hasContextStore)
  170. {
  171. StoreLocals(block, globalOutputs[block.Index].IntMask, RegisterType.Integer, mode, isCompleteFunction);
  172. StoreLocals(block, globalOutputs[block.Index].VecMask, RegisterType.Vector, mode, isCompleteFunction);
  173. }
  174. }
  175. }
  176. private static bool HasContextLoad(BasicBlock block)
  177. {
  178. return StartsWith(block, Instruction.LoadFromContext) && block.Operations.First.SourcesCount == 0;
  179. }
  180. private static bool HasContextStore(BasicBlock block)
  181. {
  182. return EndsWith(block, Instruction.StoreToContext) && block.GetLastOp().SourcesCount == 0;
  183. }
  184. private static bool StartsWith(BasicBlock block, Instruction inst)
  185. {
  186. if (block.Operations.Count == 0)
  187. {
  188. return false;
  189. }
  190. return block.Operations.First is Operation operation && operation.Instruction == inst;
  191. }
  192. private static bool EndsWith(BasicBlock block, Instruction inst)
  193. {
  194. if (block.Operations.Count == 0)
  195. {
  196. return false;
  197. }
  198. return block.Operations.Last is Operation operation && operation.Instruction == inst;
  199. }
  200. private static RegisterMask GetMask(Register register)
  201. {
  202. long intMask = 0;
  203. long vecMask = 0;
  204. switch (register.Type)
  205. {
  206. case RegisterType.Flag: intMask = (1L << RegsCount) << register.Index; break;
  207. case RegisterType.Integer: intMask = 1L << register.Index; break;
  208. case RegisterType.FpFlag: vecMask = (1L << RegsCount) << register.Index; break;
  209. case RegisterType.Vector: vecMask = 1L << register.Index; break;
  210. }
  211. return new RegisterMask(intMask, vecMask);
  212. }
  213. private static bool Exchange(RegisterMask[] masks, int blkIndex, RegisterMask value)
  214. {
  215. RegisterMask oldValue = masks[blkIndex];
  216. masks[blkIndex] = value;
  217. return oldValue != value;
  218. }
  219. private static void LoadLocals(BasicBlock block, long inputs, RegisterType baseType, ExecutionMode mode)
  220. {
  221. Operand arg0 = Local(OperandType.I64);
  222. for (int bit = 63; bit >= 0; bit--)
  223. {
  224. long mask = 1L << bit;
  225. if ((inputs & mask) == 0)
  226. {
  227. continue;
  228. }
  229. Operand dest = GetRegFromBit(bit, baseType, mode);
  230. long offset = NativeContext.GetRegisterOffset(dest.GetRegister());
  231. Operand addr = Local(OperandType.I64);
  232. Operation loadOp = new Operation(Instruction.Load, dest, addr);
  233. block.Operations.AddFirst(loadOp);
  234. Operation calcOffsOp = new Operation(Instruction.Add, addr, arg0, Const(offset));
  235. block.Operations.AddFirst(calcOffsOp);
  236. }
  237. Operation loadArg0 = new Operation(Instruction.LoadArgument, arg0, Const(0));
  238. block.Operations.AddFirst(loadArg0);
  239. }
  240. private static void StoreLocals(BasicBlock block, long outputs, RegisterType baseType, ExecutionMode mode, bool isCompleteFunction)
  241. {
  242. if (Optimizations.AssumeStrictAbiCompliance && isCompleteFunction)
  243. {
  244. if (baseType == RegisterType.Integer || baseType == RegisterType.Flag)
  245. {
  246. outputs = ClearCallerSavedIntRegs(outputs);
  247. }
  248. else /* if (baseType == RegisterType.Vector || baseType == RegisterType.FpFlag) */
  249. {
  250. outputs = ClearCallerSavedVecRegs(outputs);
  251. }
  252. }
  253. Operand arg0 = Local(OperandType.I64);
  254. Operation loadArg0 = new Operation(Instruction.LoadArgument, arg0, Const(0));
  255. block.Append(loadArg0);
  256. for (int bit = 0; bit < 64; bit++)
  257. {
  258. long mask = 1L << bit;
  259. if ((outputs & mask) == 0)
  260. {
  261. continue;
  262. }
  263. Operand source = GetRegFromBit(bit, baseType, mode);
  264. long offset = NativeContext.GetRegisterOffset(source.GetRegister());
  265. Operand addr = Local(OperandType.I64);
  266. Operation calcOffsOp = new Operation(Instruction.Add, addr, arg0, Const(offset));
  267. block.Append(calcOffsOp);
  268. Operation storeOp = new Operation(Instruction.Store, null, addr, source);
  269. block.Append(storeOp);
  270. }
  271. }
  272. private static Operand GetRegFromBit(int bit, RegisterType baseType, ExecutionMode mode)
  273. {
  274. if (bit < RegsCount)
  275. {
  276. return new Operand(bit, baseType, GetOperandType(baseType, mode));
  277. }
  278. else if (baseType == RegisterType.Integer)
  279. {
  280. return new Operand(bit & RegsMask, RegisterType.Flag, OperandType.I32);
  281. }
  282. else if (baseType == RegisterType.Vector)
  283. {
  284. return new Operand(bit & RegsMask, RegisterType.FpFlag, OperandType.I32);
  285. }
  286. else
  287. {
  288. throw new ArgumentOutOfRangeException(nameof(bit));
  289. }
  290. }
  291. private static OperandType GetOperandType(RegisterType type, ExecutionMode mode)
  292. {
  293. switch (type)
  294. {
  295. case RegisterType.Flag: return OperandType.I32;
  296. case RegisterType.FpFlag: return OperandType.I32;
  297. case RegisterType.Integer: return (mode == ExecutionMode.Aarch64) ? OperandType.I64 : OperandType.I32;
  298. case RegisterType.Vector: return OperandType.V128;
  299. }
  300. throw new ArgumentException($"Invalid register type \"{type}\".");
  301. }
  302. private static bool EndsWithReturn(BasicBlock block)
  303. {
  304. if (!(block.GetLastOp() is Operation operation))
  305. {
  306. return false;
  307. }
  308. return operation.Instruction == Instruction.Return;
  309. }
  310. private static long ClearCallerSavedIntRegs(long mask)
  311. {
  312. // TODO: ARM32 support.
  313. mask &= ~(CallerSavedIntRegistersMask | PStateNzcvFlagsMask);
  314. return mask;
  315. }
  316. private static long ClearCallerSavedVecRegs(long mask)
  317. {
  318. // TODO: ARM32 support.
  319. mask &= ~(CallerSavedVecRegistersMask | FpStateNzcvFlagsMask);
  320. return mask;
  321. }
  322. }
  323. }