RegisterUsage.cs 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491
  1. using Ryujinx.Graphics.Shader.Decoders;
  2. using Ryujinx.Graphics.Shader.IntermediateRepresentation;
  3. using System;
  4. using System.Collections.Generic;
  5. using System.Diagnostics;
  6. using System.Numerics;
  7. namespace Ryujinx.Graphics.Shader.Translation
  8. {
  9. static class RegisterUsage
  10. {
  11. private const int RegsCount = 256;
  12. private const int RegsMask = RegsCount - 1;
  13. private const int GprMasks = 4;
  14. private const int PredMasks = 1;
  15. private const int FlagMasks = 1;
  16. private const int TotalMasks = GprMasks + PredMasks + FlagMasks;
  17. private struct RegisterMask : IEquatable<RegisterMask>
  18. {
  19. public long GprMask0 { get; set; }
  20. public long GprMask1 { get; set; }
  21. public long GprMask2 { get; set; }
  22. public long GprMask3 { get; set; }
  23. public long PredMask { get; set; }
  24. public long FlagMask { get; set; }
  25. public RegisterMask(long gprMask0, long gprMask1, long gprMask2, long gprMask3, long predMask, long flagMask)
  26. {
  27. GprMask0 = gprMask0;
  28. GprMask1 = gprMask1;
  29. GprMask2 = gprMask2;
  30. GprMask3 = gprMask3;
  31. PredMask = predMask;
  32. FlagMask = flagMask;
  33. }
  34. public readonly long GetMask(int index)
  35. {
  36. return index switch
  37. {
  38. 0 => GprMask0,
  39. 1 => GprMask1,
  40. 2 => GprMask2,
  41. 3 => GprMask3,
  42. 4 => PredMask,
  43. 5 => FlagMask,
  44. _ => throw new ArgumentOutOfRangeException(nameof(index)),
  45. };
  46. }
  47. public static RegisterMask operator &(RegisterMask x, RegisterMask y)
  48. {
  49. return new RegisterMask(
  50. x.GprMask0 & y.GprMask0,
  51. x.GprMask1 & y.GprMask1,
  52. x.GprMask2 & y.GprMask2,
  53. x.GprMask3 & y.GprMask3,
  54. x.PredMask & y.PredMask,
  55. x.FlagMask & y.FlagMask);
  56. }
  57. public static RegisterMask operator |(RegisterMask x, RegisterMask y)
  58. {
  59. return new RegisterMask(
  60. x.GprMask0 | y.GprMask0,
  61. x.GprMask1 | y.GprMask1,
  62. x.GprMask2 | y.GprMask2,
  63. x.GprMask3 | y.GprMask3,
  64. x.PredMask | y.PredMask,
  65. x.FlagMask | y.FlagMask);
  66. }
  67. public static RegisterMask operator ~(RegisterMask x)
  68. {
  69. return new RegisterMask(
  70. ~x.GprMask0,
  71. ~x.GprMask1,
  72. ~x.GprMask2,
  73. ~x.GprMask3,
  74. ~x.PredMask,
  75. ~x.FlagMask);
  76. }
  77. public static bool operator ==(RegisterMask x, RegisterMask y)
  78. {
  79. return x.Equals(y);
  80. }
  81. public static bool operator !=(RegisterMask x, RegisterMask y)
  82. {
  83. return !x.Equals(y);
  84. }
  85. public readonly override bool Equals(object obj)
  86. {
  87. return obj is RegisterMask regMask && Equals(regMask);
  88. }
  89. public readonly bool Equals(RegisterMask other)
  90. {
  91. return GprMask0 == other.GprMask0 &&
  92. GprMask1 == other.GprMask1 &&
  93. GprMask2 == other.GprMask2 &&
  94. GprMask3 == other.GprMask3 &&
  95. PredMask == other.PredMask &&
  96. FlagMask == other.FlagMask;
  97. }
  98. public readonly override int GetHashCode()
  99. {
  100. return HashCode.Combine(GprMask0, GprMask1, GprMask2, GprMask3, PredMask, FlagMask);
  101. }
  102. }
  103. public readonly struct FunctionRegisterUsage
  104. {
  105. public Register[] InArguments { get; }
  106. public Register[] OutArguments { get; }
  107. public FunctionRegisterUsage(Register[] inArguments, Register[] outArguments)
  108. {
  109. InArguments = inArguments;
  110. OutArguments = outArguments;
  111. }
  112. }
  113. public static FunctionRegisterUsage RunPass(ControlFlowGraph cfg)
  114. {
  115. List<Register> inArguments = new();
  116. List<Register> outArguments = new();
  117. // Compute local register inputs and outputs used inside blocks.
  118. RegisterMask[] localInputs = new RegisterMask[cfg.Blocks.Length];
  119. RegisterMask[] localOutputs = new RegisterMask[cfg.Blocks.Length];
  120. foreach (BasicBlock block in cfg.Blocks)
  121. {
  122. for (LinkedListNode<INode> node = block.Operations.First; node != null; node = node.Next)
  123. {
  124. Operation operation = node.Value as Operation;
  125. for (int srcIndex = 0; srcIndex < operation.SourcesCount; srcIndex++)
  126. {
  127. Operand source = operation.GetSource(srcIndex);
  128. if (source.Type != OperandType.Register)
  129. {
  130. continue;
  131. }
  132. Register register = source.GetRegister();
  133. localInputs[block.Index] |= GetMask(register) & ~localOutputs[block.Index];
  134. }
  135. for (int dstIndex = 0; dstIndex < operation.DestsCount; dstIndex++)
  136. {
  137. Operand dest = operation.GetDest(dstIndex);
  138. if (dest != null && dest.Type == OperandType.Register)
  139. {
  140. localOutputs[block.Index] |= GetMask(dest.GetRegister());
  141. }
  142. }
  143. }
  144. }
  145. // Compute global register inputs and outputs used across blocks.
  146. RegisterMask[] globalCmnOutputs = new RegisterMask[cfg.Blocks.Length];
  147. RegisterMask[] globalInputs = new RegisterMask[cfg.Blocks.Length];
  148. RegisterMask[] globalOutputs = new RegisterMask[cfg.Blocks.Length];
  149. RegisterMask allOutputs = new();
  150. RegisterMask allCmnOutputs = new(-1L, -1L, -1L, -1L, -1L, -1L);
  151. bool modified;
  152. bool firstPass = true;
  153. do
  154. {
  155. modified = false;
  156. // Compute register outputs.
  157. for (int index = cfg.PostOrderBlocks.Length - 1; index >= 0; index--)
  158. {
  159. BasicBlock block = cfg.PostOrderBlocks[index];
  160. if (block.Predecessors.Count != 0)
  161. {
  162. BasicBlock predecessor = block.Predecessors[0];
  163. RegisterMask cmnOutputs = localOutputs[predecessor.Index] | globalCmnOutputs[predecessor.Index];
  164. RegisterMask outputs = globalOutputs[predecessor.Index];
  165. for (int pIndex = 1; pIndex < block.Predecessors.Count; pIndex++)
  166. {
  167. predecessor = block.Predecessors[pIndex];
  168. cmnOutputs &= localOutputs[predecessor.Index] | globalCmnOutputs[predecessor.Index];
  169. outputs |= globalOutputs[predecessor.Index];
  170. }
  171. globalInputs[block.Index] |= outputs & ~cmnOutputs;
  172. if (!firstPass)
  173. {
  174. cmnOutputs &= globalCmnOutputs[block.Index];
  175. }
  176. if (EndsWithReturn(block))
  177. {
  178. allCmnOutputs &= cmnOutputs | localOutputs[block.Index];
  179. }
  180. if (Exchange(globalCmnOutputs, block.Index, cmnOutputs))
  181. {
  182. modified = true;
  183. }
  184. outputs |= localOutputs[block.Index];
  185. if (Exchange(globalOutputs, block.Index, globalOutputs[block.Index] | outputs))
  186. {
  187. allOutputs |= outputs;
  188. modified = true;
  189. }
  190. }
  191. else if (Exchange(globalOutputs, block.Index, localOutputs[block.Index]))
  192. {
  193. allOutputs |= localOutputs[block.Index];
  194. modified = true;
  195. }
  196. }
  197. // Compute register inputs.
  198. for (int index = 0; index < cfg.PostOrderBlocks.Length; index++)
  199. {
  200. BasicBlock block = cfg.PostOrderBlocks[index];
  201. RegisterMask inputs = localInputs[block.Index];
  202. if (block.Next != null)
  203. {
  204. inputs |= globalInputs[block.Next.Index];
  205. }
  206. if (block.Branch != null)
  207. {
  208. inputs |= globalInputs[block.Branch.Index];
  209. }
  210. inputs &= ~globalCmnOutputs[block.Index];
  211. if (Exchange(globalInputs, block.Index, globalInputs[block.Index] | inputs))
  212. {
  213. modified = true;
  214. }
  215. }
  216. firstPass = false;
  217. }
  218. while (modified);
  219. // Insert load and store context instructions where needed.
  220. foreach (BasicBlock block in cfg.Blocks)
  221. {
  222. // The only block without any predecessor should be the entry block.
  223. // It always needs a context load as it is the first block to run.
  224. if (block.Predecessors.Count == 0)
  225. {
  226. RegisterMask inputs = globalInputs[block.Index] | (allOutputs & ~allCmnOutputs);
  227. LoadLocals(block, inputs, inArguments);
  228. }
  229. if (EndsWithReturn(block))
  230. {
  231. StoreLocals(block, allOutputs, inArguments.Count, outArguments);
  232. }
  233. }
  234. return new FunctionRegisterUsage(inArguments.ToArray(), outArguments.ToArray());
  235. }
  236. public static void FixupCalls(BasicBlock[] blocks, FunctionRegisterUsage[] frus)
  237. {
  238. foreach (BasicBlock block in blocks)
  239. {
  240. for (LinkedListNode<INode> node = block.Operations.First; node != null; node = node.Next)
  241. {
  242. Operation operation = node.Value as Operation;
  243. if (operation.Inst == Instruction.Call)
  244. {
  245. Operand funcId = operation.GetSource(0);
  246. Debug.Assert(funcId.Type == OperandType.Constant);
  247. var fru = frus[funcId.Value];
  248. Operand[] inRegs = new Operand[fru.InArguments.Length];
  249. for (int i = 0; i < fru.InArguments.Length; i++)
  250. {
  251. inRegs[i] = OperandHelper.Register(fru.InArguments[i]);
  252. }
  253. operation.AppendSources(inRegs);
  254. Operand[] outRegs = new Operand[1 + fru.OutArguments.Length];
  255. for (int i = 0; i < fru.OutArguments.Length; i++)
  256. {
  257. outRegs[1 + i] = OperandHelper.Register(fru.OutArguments[i]);
  258. }
  259. operation.AppendDests(outRegs);
  260. }
  261. }
  262. }
  263. }
  264. private static bool StartsWith(BasicBlock block, Instruction inst)
  265. {
  266. if (block.Operations.Count == 0)
  267. {
  268. return false;
  269. }
  270. return block.Operations.First.Value is Operation operation && operation.Inst == inst;
  271. }
  272. private static bool EndsWith(BasicBlock block, Instruction inst)
  273. {
  274. if (block.Operations.Count == 0)
  275. {
  276. return false;
  277. }
  278. return block.Operations.Last.Value is Operation operation && operation.Inst == inst;
  279. }
  280. private static RegisterMask GetMask(Register register)
  281. {
  282. Span<long> gprMasks = stackalloc long[4];
  283. long predMask = 0;
  284. long flagMask = 0;
  285. switch (register.Type)
  286. {
  287. case RegisterType.Gpr:
  288. gprMasks[register.Index >> 6] = 1L << (register.Index & 0x3f);
  289. break;
  290. case RegisterType.Predicate:
  291. predMask = 1L << register.Index;
  292. break;
  293. case RegisterType.Flag:
  294. flagMask = 1L << register.Index;
  295. break;
  296. }
  297. return new RegisterMask(gprMasks[0], gprMasks[1], gprMasks[2], gprMasks[3], predMask, flagMask);
  298. }
  299. private static bool Exchange(RegisterMask[] masks, int blkIndex, RegisterMask value)
  300. {
  301. RegisterMask oldValue = masks[blkIndex];
  302. masks[blkIndex] = value;
  303. return oldValue != value;
  304. }
  305. private static void LoadLocals(BasicBlock block, RegisterMask masks, List<Register> inArguments)
  306. {
  307. bool fillArgsList = inArguments.Count == 0;
  308. LinkedListNode<INode> node = null;
  309. int argIndex = 0;
  310. for (int i = 0; i < TotalMasks; i++)
  311. {
  312. (RegisterType regType, int baseRegIndex) = GetRegTypeAndBaseIndex(i);
  313. long mask = masks.GetMask(i);
  314. while (mask != 0)
  315. {
  316. int bit = BitOperations.TrailingZeroCount(mask);
  317. mask &= ~(1L << bit);
  318. Register register = new(baseRegIndex + bit, regType);
  319. if (fillArgsList)
  320. {
  321. inArguments.Add(register);
  322. }
  323. Operation copyOp = new(Instruction.Copy, OperandHelper.Register(register), OperandHelper.Argument(argIndex++));
  324. if (node == null)
  325. {
  326. node = block.Operations.AddFirst(copyOp);
  327. }
  328. else
  329. {
  330. node = block.Operations.AddAfter(node, copyOp);
  331. }
  332. }
  333. }
  334. Debug.Assert(argIndex <= inArguments.Count);
  335. }
  336. private static void StoreLocals(BasicBlock block, RegisterMask masks, int inArgumentsCount, List<Register> outArguments)
  337. {
  338. LinkedListNode<INode> node = null;
  339. int argIndex = inArgumentsCount;
  340. bool fillArgsList = outArguments.Count == 0;
  341. for (int i = 0; i < TotalMasks; i++)
  342. {
  343. (RegisterType regType, int baseRegIndex) = GetRegTypeAndBaseIndex(i);
  344. long mask = masks.GetMask(i);
  345. while (mask != 0)
  346. {
  347. int bit = BitOperations.TrailingZeroCount(mask);
  348. mask &= ~(1L << bit);
  349. Register register = new(baseRegIndex + bit, regType);
  350. if (fillArgsList)
  351. {
  352. outArguments.Add(register);
  353. }
  354. Operation copyOp = new(Instruction.Copy, OperandHelper.Argument(argIndex++), OperandHelper.Register(register));
  355. if (node == null)
  356. {
  357. node = block.Operations.AddBefore(block.Operations.Last, copyOp);
  358. }
  359. else
  360. {
  361. node = block.Operations.AddAfter(node, copyOp);
  362. }
  363. }
  364. }
  365. Debug.Assert(argIndex <= inArgumentsCount + outArguments.Count);
  366. }
  367. private static (RegisterType RegType, int BaseRegIndex) GetRegTypeAndBaseIndex(int i)
  368. {
  369. RegisterType regType = RegisterType.Gpr;
  370. int baseRegIndex = 0;
  371. if (i < GprMasks)
  372. {
  373. baseRegIndex = i * sizeof(long) * 8;
  374. }
  375. else if (i == GprMasks)
  376. {
  377. regType = RegisterType.Predicate;
  378. }
  379. else
  380. {
  381. regType = RegisterType.Flag;
  382. }
  383. return (regType, baseRegIndex);
  384. }
  385. private static bool EndsWithReturn(BasicBlock block)
  386. {
  387. if (block.GetLastOp() is not Operation operation)
  388. {
  389. return false;
  390. }
  391. return operation.Inst == Instruction.Return;
  392. }
  393. }
  394. }