// RegisterUsage.cs (14 KB)
  1. using ARMeilleure.IntermediateRepresentation;
  2. using ARMeilleure.State;
  3. using System;
  4. using static ARMeilleure.IntermediateRepresentation.OperandHelper;
  5. namespace ARMeilleure.Translation
  6. {
  7. static class RegisterUsage
  8. {
  // Bits 9 to 15 of the integer mask. ClearCallerSavedIntRegs removes them from the stored set.
  private const long CallerSavedIntRegistersMask = 0x7fL << 9;

  // Bits 60 to 63 of the integer mask. GetMask places flag N at bit (RegsCount + N),
  // so these bits correspond to flag indices 28 to 31.
  private const long PStateNzcvFlagsMask = 0xfL << 60;

  // Bits 16 to 31 of the vector mask. ClearCallerSavedVecRegs removes them from the stored set.
  private const long CallerSavedVecRegistersMask = 0xffffL << 16;

  // Number of low mask bits reserved for directly indexed registers; in the integer mask
  // the flag bits start right above them.
  private const int RegsCount = 32;

  // Used to turn a bit position at or above RegsCount back into a flag index.
  private const int RegsMask = RegsCount - 1;
  /// <summary>
  /// A pair of 64-bit bit sets: one for integer registers and flags, one for vector registers.
  /// The bitwise operators act on both sets at once, and equality compares both sets.
  /// </summary>
  private struct RegisterMask : IEquatable<RegisterMask>
  {
      /// <summary>Bit set holding integer registers (low bits) and flags (bits above them).</summary>
      public long IntMask { get; set; }

      /// <summary>Bit set holding vector registers.</summary>
      public long VecMask { get; set; }

      /// <summary>Creates a mask from the two raw bit sets.</summary>
      public RegisterMask(long intMask, long vecMask)
      {
          IntMask = intMask;
          VecMask = vecMask;
      }

      /// <summary>Intersection of both bit sets.</summary>
      public static RegisterMask operator &(RegisterMask x, RegisterMask y)
          => new RegisterMask(x.IntMask & y.IntMask, x.VecMask & y.VecMask);

      /// <summary>Union of both bit sets.</summary>
      public static RegisterMask operator |(RegisterMask x, RegisterMask y)
          => new RegisterMask(x.IntMask | y.IntMask, x.VecMask | y.VecMask);

      /// <summary>Complement of both bit sets.</summary>
      public static RegisterMask operator ~(RegisterMask x)
          => new RegisterMask(~x.IntMask, ~x.VecMask);

      public static bool operator ==(RegisterMask x, RegisterMask y) => x.Equals(y);

      public static bool operator !=(RegisterMask x, RegisterMask y) => !x.Equals(y);

      /// <summary>Returns true only when <paramref name="obj"/> is a mask with the same two bit sets.</summary>
      public override bool Equals(object obj) => obj is RegisterMask boxed && Equals(boxed);

      /// <summary>Returns true when both bit sets match those of <paramref name="other"/>.</summary>
      public bool Equals(RegisterMask other)
          => IntMask == other.IntMask && VecMask == other.VecMask;

      public override int GetHashCode() => HashCode.Combine(IntMask, VecMask);
  }
  /// <summary>
  /// Determines which registers each basic block reads and writes, propagates that information
  /// across the control flow graph until no mask changes any more, and then inserts the
  /// register loads and stores that the blocks need.
  /// </summary>
  /// <param name="cfg">Control flow graph to analyse. Its blocks are modified in place.</param>
  /// <param name="isCompleteFunction">
  /// Forwarded to <see cref="StoreLocals"/>, where it takes part in deciding whether
  /// caller saved registers are dropped from the stored set.
  /// </param>
  /// <exception cref="InvalidCastException">
  /// A block contains a node that is not an <see cref="Operation"/>.
  /// </exception>
  public static void RunPass(ControlFlowGraph cfg, bool isCompleteFunction)
  {
      // Compute local register inputs and outputs used inside blocks.
      RegisterMask[] localInputs = new RegisterMask[cfg.Blocks.Count];
      RegisterMask[] localOutputs = new RegisterMask[cfg.Blocks.Count];

      foreach (BasicBlock block in cfg.Blocks)
      {
          foreach (Node node in block.Operations)
          {
              // Every node is expected to be an Operation. A direct cast reports a violation
              // right here with an accurate exception, instead of letting a null reference
              // escape from an unchecked "as" conversion a few lines further down.
              Operation operation = (Operation)node;

              for (int srcIndex = 0; srcIndex < operation.SourcesCount; srcIndex++)
              {
                  Operand source = operation.GetSource(srcIndex);

                  if (source.Kind != OperandKind.Register)
                  {
                      continue;
                  }

                  Register register = source.GetRegister();

                  // A read only counts as a block input when the block has not written
                  // the register before this point.
                  localInputs[block.Index] |= GetMask(register) & ~localOutputs[block.Index];
              }

              if (operation.Destination != null && operation.Destination.Kind == OperandKind.Register)
              {
                  localOutputs[block.Index] |= GetMask(operation.Destination.GetRegister());
              }
          }
      }

      // Compute global register inputs and outputs used across blocks.
      RegisterMask[] globalCmnOutputs = new RegisterMask[cfg.Blocks.Count];
      RegisterMask[] globalInputs = new RegisterMask[cfg.Blocks.Count];
      RegisterMask[] globalOutputs = new RegisterMask[cfg.Blocks.Count];

      bool modified;
      bool firstPass = true;

      // Repeat both sweeps until neither of them changes any mask.
      do
      {
          modified = false;

          // Compute register outputs.
          for (int index = cfg.PostOrderBlocks.Length - 1; index >= 0; index--)
          {
              BasicBlock block = cfg.PostOrderBlocks[index];

              if (block.Predecessors.Count != 0 && !HasContextLoad(block))
              {
                  BasicBlock predecessor = block.Predecessors[0];

                  // cmnOutputs: registers written on every incoming path (intersection).
                  // outputs: registers written on at least one incoming path (union).
                  RegisterMask cmnOutputs = localOutputs[predecessor.Index] | globalCmnOutputs[predecessor.Index];
                  RegisterMask outputs = globalOutputs[predecessor.Index];

                  for (int pIndex = 1; pIndex < block.Predecessors.Count; pIndex++)
                  {
                      predecessor = block.Predecessors[pIndex];

                      cmnOutputs &= localOutputs[predecessor.Index] | globalCmnOutputs[predecessor.Index];
                      outputs |= globalOutputs[predecessor.Index];
                  }

                  // Registers written on some, but not all, incoming paths become inputs of this block.
                  globalInputs[block.Index] |= outputs & ~cmnOutputs;

                  // After the first pass the common set of a block can only shrink.
                  if (!firstPass)
                  {
                      cmnOutputs &= globalCmnOutputs[block.Index];
                  }

                  if (Exchange(globalCmnOutputs, block.Index, cmnOutputs))
                  {
                      modified = true;
                  }

                  outputs |= localOutputs[block.Index];

                  if (Exchange(globalOutputs, block.Index, globalOutputs[block.Index] | outputs))
                  {
                      modified = true;
                  }
              }
              else if (Exchange(globalOutputs, block.Index, localOutputs[block.Index]))
              {
                  modified = true;
              }
          }

          // Compute register inputs.
          for (int index = 0; index < cfg.PostOrderBlocks.Length; index++)
          {
              BasicBlock block = cfg.PostOrderBlocks[index];

              RegisterMask inputs = localInputs[block.Index];

              if (block.Next != null)
              {
                  inputs |= globalInputs[block.Next.Index];
              }

              if (block.Branch != null)
              {
                  inputs |= globalInputs[block.Branch.Index];
              }

              // Registers already written on every path into this block are not inputs.
              inputs &= ~globalCmnOutputs[block.Index];

              if (Exchange(globalInputs, block.Index, globalInputs[block.Index] | inputs))
              {
                  modified = true;
              }
          }

          firstPass = false;
      }
      while (modified);

      // Insert load and store context instructions where needed.
      foreach (BasicBlock block in cfg.Blocks)
      {
          bool hasContextLoad = HasContextLoad(block);

          if (hasContextLoad)
          {
              // The marker operation is replaced by the explicit loads inserted below.
              block.Operations.RemoveFirst();
          }

          // The only block without any predecessor should be the entry block.
          // It always needs a context load as it is the first block to run.
          if (block.Predecessors.Count == 0 || hasContextLoad)
          {
              // LoadLocals prepends, so the integer loads end up ahead of the vector loads.
              LoadLocals(block, globalInputs[block.Index].VecMask, RegisterType.Vector);
              LoadLocals(block, globalInputs[block.Index].IntMask, RegisterType.Integer);
          }

          bool hasContextStore = HasContextStore(block);

          if (hasContextStore)
          {
              // The marker operation is replaced by the explicit stores appended below.
              block.Operations.RemoveLast();
          }

          if (EndsWithReturn(block) || hasContextStore)
          {
              StoreLocals(block, globalOutputs[block.Index].IntMask, RegisterType.Integer, isCompleteFunction);
              StoreLocals(block, globalOutputs[block.Index].VecMask, RegisterType.Vector, isCompleteFunction);
          }
      }
  }
  /// <summary>
  /// Tells whether the first operation of the block is a LoadFromContext that has no sources.
  /// </summary>
  private static bool HasContextLoad(BasicBlock block)
  {
      if (!StartsWith(block, Instruction.LoadFromContext))
      {
          return false;
      }

      // StartsWith only succeeds on a non-empty block, so First is available here.
      return block.Operations.First.Value.SourcesCount == 0;
  }
  /// <summary>
  /// Tells whether the last operation of the block is a StoreToContext that has no sources.
  /// </summary>
  private static bool HasContextStore(BasicBlock block)
  {
      if (!EndsWith(block, Instruction.StoreToContext))
      {
          return false;
      }

      return block.GetLastOp().SourcesCount == 0;
  }
  /// <summary>
  /// Tells whether the block is non-empty and its first node is an operation using
  /// the instruction <paramref name="inst"/>.
  /// </summary>
  private static bool StartsWith(BasicBlock block, Instruction inst)
      => block.Operations.Count != 0
      && block.Operations.First.Value is Operation first
      && first.Instruction == inst;
  /// <summary>
  /// Tells whether the block is non-empty and its last node is an operation using
  /// the instruction <paramref name="inst"/>.
  /// </summary>
  private static bool EndsWith(BasicBlock block, Instruction inst)
      => block.Operations.Count != 0
      && block.Operations.Last.Value is Operation last
      && last.Instruction == inst;
  /// <summary>
  /// Builds the single-bit mask that represents <paramref name="register"/>.
  /// Integer registers use bit Index of the integer set, flags use bit (RegsCount + Index)
  /// of the integer set, and vector registers use bit Index of the vector set.
  /// Any other register type yields an empty mask.
  /// </summary>
  private static RegisterMask GetMask(Register register)
  {
      switch (register.Type)
      {
          case RegisterType.Flag:
              return new RegisterMask((1L << RegsCount) << register.Index, 0);

          case RegisterType.Integer:
              return new RegisterMask(1L << register.Index, 0);

          case RegisterType.Vector:
              return new RegisterMask(0, 1L << register.Index);

          default:
              return new RegisterMask(0, 0);
      }
  }
  /// <summary>
  /// Stores <paramref name="value"/> at <paramref name="blkIndex"/> and reports whether
  /// it differs from the value that was there before.
  /// </summary>
  /// <returns>True when the stored mask changed; false otherwise.</returns>
  private static bool Exchange(RegisterMask[] masks, int blkIndex, RegisterMask value)
  {
      bool changed = masks[blkIndex] != value;

      masks[blkIndex] = value;

      return changed;
  }
  /// <summary>
  /// Prepends to <paramref name="block"/> one address computation and one load for every
  /// bit set in <paramref name="inputs"/>, preceded by a single LoadArgument of argument 0
  /// that provides the base address.
  /// </summary>
  /// <param name="block">Block that receives the new operations at its start.</param>
  /// <param name="inputs">Bit set of registers to load.</param>
  /// <param name="baseType">Register type used to interpret the bit positions.</param>
  private static void LoadLocals(BasicBlock block, long inputs, RegisterType baseType)
  {
      Operand argument = Local(OperandType.I64);

      // Operations are prepended, so walking from the highest bit down leaves the
      // lowest register first in the final order.
      for (int bit = 63; bit >= 0; bit--)
      {
          if ((inputs & (1L << bit)) != 0)
          {
              Operand target = GetRegFromBit(bit, baseType);

              long offset = NativeContext.GetRegisterOffset(target.GetRegister());

              Operand address = Local(OperandType.I64);

              // The load is prepended first so that the address computation lands in front of it.
              block.Operations.AddFirst(new Operation(Instruction.Load, target, address));
              block.Operations.AddFirst(new Operation(Instruction.Add, address, argument, Const(offset)));
          }
      }

      // Added last so it precedes every address computation that uses it.
      block.Operations.AddFirst(new Operation(Instruction.LoadArgument, argument, Const(0)));
  }
  /// <summary>
  /// Appends to <paramref name="block"/> a LoadArgument of argument 0, followed by one
  /// address computation and one store for every bit set in <paramref name="outputs"/>.
  /// </summary>
  /// <param name="block">Block that receives the new operations at its end.</param>
  /// <param name="outputs">Bit set of registers to store.</param>
  /// <param name="baseType">Register type used to interpret the bit positions.</param>
  /// <param name="isCompleteFunction">
  /// When true and Optimizations.AssumeStrictAbiCompliance is also set, caller saved
  /// registers are removed from <paramref name="outputs"/> before any store is emitted.
  /// </param>
  private static void StoreLocals(BasicBlock block, long outputs, RegisterType baseType, bool isCompleteFunction)
  {
      if (Optimizations.AssumeStrictAbiCompliance && isCompleteFunction)
      {
          // Flags share the integer bit set, so both use the integer variant.
          bool usesIntegerSet = baseType == RegisterType.Integer || baseType == RegisterType.Flag;

          outputs = usesIntegerSet
              ? ClearCallerSavedIntRegs(outputs)
              : ClearCallerSavedVecRegs(outputs);
      }

      Operand argument = Local(OperandType.I64);

      block.Append(new Operation(Instruction.LoadArgument, argument, Const(0)));

      for (int bit = 0; bit < 64; bit++)
      {
          if ((outputs & (1L << bit)) != 0)
          {
              Operand value = GetRegFromBit(bit, baseType);

              long offset = NativeContext.GetRegisterOffset(value.GetRegister());

              Operand address = Local(OperandType.I64);

              block.Append(new Operation(Instruction.Add, address, argument, Const(offset)));
              block.Append(new Operation(Instruction.Store, null, address, value));
          }
      }
  }
  /// <summary>
  /// Converts a bit position of a register bit set back into a register operand.
  /// Positions below RegsCount map to a register of <paramref name="baseType"/>;
  /// positions at or above it are only valid for the integer set, where they map to flags.
  /// </summary>
  /// <exception cref="ArgumentOutOfRangeException">
  /// <paramref name="bit"/> is at or above RegsCount and <paramref name="baseType"/> is not Integer.
  /// </exception>
  private static Operand GetRegFromBit(int bit, RegisterType baseType)
  {
      if (bit >= RegsCount)
      {
          if (baseType != RegisterType.Integer)
          {
              throw new ArgumentOutOfRangeException(nameof(bit));
          }

          // Upper half of the integer set: strip the offset to recover the flag index.
          return new Operand(bit & RegsMask, RegisterType.Flag, OperandType.I32);
      }

      return new Operand(bit, baseType, GetOperandType(baseType));
  }
  /// <summary>
  /// Maps a register type to the operand type used for it: I32 for flags,
  /// I64 for integer registers and V128 for vector registers.
  /// </summary>
  /// <exception cref="ArgumentException"><paramref name="type"/> is none of the three.</exception>
  private static OperandType GetOperandType(RegisterType type)
  {
      if (type == RegisterType.Flag)
      {
          return OperandType.I32;
      }

      if (type == RegisterType.Integer)
      {
          return OperandType.I64;
      }

      if (type == RegisterType.Vector)
      {
          return OperandType.V128;
      }

      throw new ArgumentException($"Invalid register type \"{type}\".");
  }
  /// <summary>
  /// Tells whether the last node of the block is an operation using the Return instruction.
  /// </summary>
  private static bool EndsWithReturn(BasicBlock block)
      => block.GetLastOp() is Operation last && last.Instruction == Instruction.Return;
  /// <summary>
  /// Returns <paramref name="mask"/> with the bits of CallerSavedIntRegistersMask and
  /// PStateNzcvFlagsMask cleared.
  /// </summary>
  private static long ClearCallerSavedIntRegs(long mask)
  {
      // TODO: ARM32 support.
      const long Removed = CallerSavedIntRegistersMask | PStateNzcvFlagsMask;

      return mask & ~Removed;
  }
  /// <summary>
  /// Returns <paramref name="mask"/> with the bits of CallerSavedVecRegistersMask cleared.
  /// </summary>
  private static long ClearCallerSavedVecRegs(long mask)
  {
      // TODO: ARM32 support.
      return mask & ~CallerSavedVecRegistersMask;
  }
  315. }
  316. }