Buffer.cs 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491
  1. using Ryujinx.Cpu.Tracking;
  2. using Ryujinx.Graphics.GAL;
  3. using Ryujinx.Memory.Range;
  4. using Ryujinx.Memory.Tracking;
  5. using System;
  6. using System.Collections.Generic;
  7. using System.Linq;
  8. namespace Ryujinx.Graphics.Gpu.Memory
  9. {
  10. /// <summary>
  11. /// Buffer, used to store vertex and index data, uniform and storage buffers, and others.
  12. /// </summary>
  13. class Buffer : IRange, IDisposable
  14. {
  /// <summary>
  /// Size limit in bytes; buffers strictly larger than this use granular memory tracking.
  /// </summary>
  private const ulong GranularBufferThreshold = 4096;

  private readonly GpuContext _context;
  private readonly PhysicalMemory _physicalMemory;

  /// <summary>
  /// Handle of the buffer on the host.
  /// </summary>
  public BufferHandle Handle { get; }

  /// <summary>
  /// Guest memory address where the buffer begins.
  /// </summary>
  public ulong Address { get; }

  /// <summary>
  /// Buffer size, in bytes.
  /// </summary>
  public ulong Size { get; }

  /// <summary>
  /// Guest memory address where the buffer ends (<see cref="Address"/> plus <see cref="Size"/>).
  /// </summary>
  public ulong EndAddress
  {
      get { return Address + Size; }
  }

  /// <summary>
  /// Counter that is bumped every time the buffer is (partially) unmapped or its data is disposed.
  /// </summary>
  public int UnmappedSequence { get; private set; }

  /// <summary>
  /// Regions of the buffer that were modified by the GPU.
  /// These regions cannot be updated from the CPU until a CPU waiting sync point is reached;
  /// write tracking then signals, waits for the GPU sync generated at the syncpoint, and flushes them.
  /// </summary>
  /// <remarks>
  /// Stays null until the first modification is recorded.
  /// </remarks>
  private BufferModifiedRangeList _modifiedRanges;

  // Exactly one of the two tracking handles is created by the constructor, selected by _useGranular.
  private readonly CpuMultiRegionHandle _memoryTrackingGranular;
  private readonly CpuRegionHandle _memoryTracking;

  // Delegates are created once in the constructor and reused on every call.
  private readonly RegionSignal _externalFlushDelegate;
  private readonly Action<ulong, ulong> _loadDelegate;
  private readonly Action<ulong, ulong> _modifiedDelegate;

  // Context sequence number observed at the last non-granular synchronization.
  private int _sequenceNumber;

  private bool _useGranular;
  private bool _syncActionRegistered;
  /// <summary>
  /// Creates a new buffer, allocating its host storage and starting memory tracking for its range.
  /// </summary>
  /// <param name="context">GPU context that owns the buffer</param>
  /// <param name="physicalMemory">Physical memory where the buffer is mapped</param>
  /// <param name="address">Start address of the buffer</param>
  /// <param name="size">Size of the buffer in bytes</param>
  /// <param name="baseBuffers">Buffers contained by this buffer, whose tracking handles are inherited</param>
  public Buffer(GpuContext context, PhysicalMemory physicalMemory, ulong address, ulong size, IEnumerable<Buffer> baseBuffers = null)
  {
      _context = context;
      _physicalMemory = physicalMemory;

      Address = address;
      Size = size;

      Handle = context.Renderer.CreateBuffer((int)size);

      _useGranular = size > GranularBufferThreshold;

      // Lazily collects the tracking handles of every base buffer, whichever kind each one owns.
      IEnumerable<IRegionHandle> inheritedHandles = null;

      if (baseBuffers != null)
      {
          inheritedHandles = baseBuffers.SelectMany(parent =>
          {
              if (!parent._useGranular)
              {
                  return Enumerable.Repeat(parent._memoryTracking.GetHandle(), 1);
              }

              return parent._memoryTrackingGranular.GetHandles();
          });
      }

      if (!_useGranular)
      {
          _memoryTracking = physicalMemory.BeginTracking(address, size);

          if (inheritedHandles != null)
          {
              // Start from Reprotect(false), then switch to Reprotect(true) if any inherited handle is dirty.
              _memoryTracking.Reprotect(false);

              foreach (IRegionHandle inherited in inheritedHandles)
              {
                  if (inherited.Dirty)
                  {
                      _memoryTracking.Reprotect(true);
                  }

                  // The single handle replaces the inherited ones, so they are released here.
                  inherited.Dispose();
              }
          }
      }
      else
      {
          _memoryTrackingGranular = physicalMemory.BeginGranularTracking(address, size, inheritedHandles);
      }

      _externalFlushDelegate = ExternalFlush;
      _loadDelegate = LoadRegion;
      _modifiedDelegate = RegionModified;
  }
  /// <summary>
  /// Gets the sub-range of the buffer that starts at the given address and runs to the end of the buffer.
  /// </summary>
  /// <remarks>
  /// The result can be used to bind and use a sub-range of the buffer on the host API.
  /// </remarks>
  /// <param name="address">Start address of the sub-range, must be greater than or equal to the buffer address</param>
  /// <returns>The buffer sub-range</returns>
  public BufferRange GetRange(ulong address)
  {
      ulong startOffset = address - Address;
      ulong remaining = Size - startOffset;

      return new BufferRange(Handle, (int)startOffset, (int)remaining);
  }
  /// <summary>
  /// Gets a sub-range of the buffer with an explicit size.
  /// </summary>
  /// <remarks>
  /// The result can be used to bind and use a sub-range of the buffer on the host API.
  /// </remarks>
  /// <param name="address">Start address of the sub-range, must be greater than or equal to the buffer address</param>
  /// <param name="size">Size in bytes of the sub-range, must be less than or equal to the buffer size</param>
  /// <returns>The buffer sub-range</returns>
  public BufferRange GetRange(ulong address, ulong size)
  {
      ulong startOffset = address - Address;

      return new BufferRange(Handle, (int)startOffset, (int)size);
  }
  /// <summary>
  /// Tests whether a memory range intersects the range covered by this buffer.
  /// </summary>
  /// <param name="address">Start address of the range</param>
  /// <param name="size">Size in bytes of the range</param>
  /// <returns>True if the range overlaps, false otherwise</returns>
  public bool OverlapsWith(ulong address, ulong size)
  {
      bool startsBeforeRangeEnd = Address < address + size;

      return startsBeforeRangeEnd && address < EndAddress;
  }
  /// <summary>
  /// Tests whether a memory range lies entirely inside the range covered by this buffer.
  /// </summary>
  /// <param name="address">Start address of the range</param>
  /// <param name="size">Size in bytes of the range</param>
  /// <returns>True if the range is contained, false otherwise</returns>
  public bool FullyContains(ulong address, ulong size)
  {
      if (address < Address)
      {
          return false;
      }

      return address + size <= EndAddress;
  }
  /// <summary>
  /// Synchronizes the buffer data from guest memory to the host buffer.
  /// </summary>
  /// <remarks>
  /// Buffer data is overwritten when a CPU write was detected since the previous call to this method.
  /// </remarks>
  /// <param name="address">Start address of the range to synchronize</param>
  /// <param name="size">Size in bytes of the range to synchronize</param>
  public void SynchronizeMemory(ulong address, ulong size)
  {
      if (_useGranular)
      {
          // Granular tracking reports each modified sub-region through the modified delegate.
          _memoryTrackingGranular.QueryModified(address, size, _modifiedDelegate, _context.SequenceNumber);

          return;
      }

      // Nothing to do if already checked for this sequence number, or if the tracked region is clean.
      if (_context.SequenceNumber == _sequenceNumber || !_memoryTracking.DirtyOrVolatile())
      {
          return;
      }

      _memoryTracking.Reprotect();

      if (_modifiedRanges == null)
      {
          // No GPU modifications recorded, so the whole buffer is uploaded at once.
          _context.Renderer.SetBufferData(Handle, 0, _physicalMemory.GetSpan(Address, (int)Size));
      }
      else
      {
          // Load through the range list so that regions it holds as GPU-modified are excluded.
          _modifiedRanges.ExcludeModifiedRegions(Address, Size, _loadDelegate);
      }

      _sequenceNumber = _context.SequenceNumber;
  }
  /// <summary>
  /// Creates the modified range list if it has not been created yet.
  /// </summary>
  private void EnsureRangeList()
  {
      if (_modifiedRanges != null)
      {
          return;
      }

      _modifiedRanges = new BufferModifiedRangeList(_context);
  }
  /// <summary>
  /// Records that a region of the buffer has been modified.
  /// </summary>
  /// <remarks>
  /// Also registers the sync action with the context, unless one is already registered.
  /// </remarks>
  /// <param name="address">The start address of the modified region</param>
  /// <param name="size">The size of the modified region</param>
  public void SignalModified(ulong address, ulong size)
  {
      EnsureRangeList();

      _modifiedRanges.SignalModified(address, size);

      if (_syncActionRegistered)
      {
          return;
      }

      _context.RegisterSyncAction(SyncAction);
      _syncActionRegistered = true;
  }
  /// <summary>
  /// Indicates that the modifications in a given region of this buffer have been overwritten.
  /// </summary>
  /// <remarks>
  /// Does nothing when no modification has been recorded yet.
  /// </remarks>
  /// <param name="address">The start address of the region</param>
  /// <param name="size">The size of the region</param>
  public void ClearModified(ulong address, ulong size)
  {
      _modifiedRanges?.Clear(address, size);
  }
  /// <summary>
  /// Action executed when a syncpoint is reached after the buffer was modified.
  /// Registers the external flush action on the tracking handles, so that the buffer is flushed
  /// from the GPU when its memory is used, and then synchronizes the affected memory.
  /// </summary>
  private void SyncAction()
  {
      // Cleared first so that a later modification registers the action again.
      _syncActionRegistered = false;

      if (!_useGranular)
      {
          _memoryTracking.RegisterAction(_externalFlushDelegate);
          SynchronizeMemory(Address, Size);

          return;
      }

      // Granular tracking: handle each range reported by the modified range list separately.
      _modifiedRanges.GetRanges(Address, Size, (rangeAddress, rangeSize) =>
      {
          _memoryTrackingGranular.RegisterAction(rangeAddress, rangeSize, _externalFlushDelegate);
          SynchronizeMemory(rangeAddress, rangeSize);
      });
  }
  /// <summary>
  /// Takes over the modified ranges of another buffer.
  /// </summary>
  /// <remarks>
  /// Does nothing when the other buffer has no modified range list.
  /// </remarks>
  /// <param name="from">The buffer to inherit from</param>
  public void InheritModifiedRanges(Buffer from)
  {
      BufferModifiedRangeList sourceRanges = from._modifiedRanges;

      if (sourceRanges == null)
      {
          return;
      }

      // A sync action pending on the source must stay pending on this buffer as well.
      if (from._syncActionRegistered && !_syncActionRegistered)
      {
          _context.RegisterSyncAction(SyncAction);
          _syncActionRegistered = true;
      }

      EnsureRangeList();

      _modifiedRanges.InheritRanges(sourceRanges, (ulong rangeAddress, ulong rangeSize) =>
      {
          // Register the flush action on whichever tracking handle this buffer owns.
          if (!_useGranular)
          {
              _memoryTracking.RegisterAction(_externalFlushDelegate);
          }
          else
          {
              _memoryTrackingGranular.RegisterAction(rangeAddress, rangeSize, _externalFlushDelegate);
          }
      });
  }
  /// <summary>
  /// Determines whether a region of the buffer has been modified, and therefore must be flushed.
  /// </summary>
  /// <param name="address">The start address of the region</param>
  /// <param name="size">The size of the region</param>
  /// <returns>True if the modified range list exists and has a range for the region, false otherwise</returns>
  public bool IsModified(ulong address, ulong size)
  {
      return _modifiedRanges != null && _modifiedRanges.HasRange(address, size);
  }
  /// <summary>
  /// Indicates that a region of the buffer was modified, and has to be loaded from memory.
  /// </summary>
  /// <remarks>
  /// The start address is clamped to the buffer start and the size is clamped so that the region
  /// does not run past the buffer end. The size is not reduced when the start address is moved up.
  /// </remarks>
  /// <param name="mAddress">Start address of the modified region</param>
  /// <param name="mSize">Size of the modified region</param>
  private void RegionModified(ulong mAddress, ulong mSize)
  {
      mAddress = Math.Max(mAddress, Address);
      mSize = Math.Min(mSize, Address + Size - mAddress);

      if (_modifiedRanges == null)
      {
          LoadRegion(mAddress, mSize);

          return;
      }

      // Load through the range list so that regions it holds as GPU-modified are excluded.
      _modifiedRanges.ExcludeModifiedRegions(mAddress, mSize, _loadDelegate);
  }
  /// <summary>
  /// Uploads a region of guest memory into the matching location of the host buffer.
  /// </summary>
  /// <param name="mAddress">Start address of the modified region</param>
  /// <param name="mSize">Size of the modified region</param>
  private void LoadRegion(ulong mAddress, ulong mSize)
  {
      ulong bufferOffset = mAddress - Address;

      _context.Renderer.SetBufferData(Handle, (int)bufferOffset, _physicalMemory.GetSpan(mAddress, (int)mSize));
  }
  /// <summary>
  /// Forces a region of the buffer to be dirty. Avoids reprotection and nullifies the sequence number check.
  /// </summary>
  /// <param name="mAddress">Start address of the modified region</param>
  /// <param name="mSize">Size of the region to force dirty</param>
  public void ForceDirty(ulong mAddress, ulong mSize)
  {
      // Modifications recorded for the region are dropped before it is marked dirty.
      _modifiedRanges?.Clear(mAddress, mSize);

      if (!_useGranular)
      {
          _memoryTracking.ForceDirty();

          // Changing the stored number keeps SynchronizeMemory from skipping on a sequence number match.
          _sequenceNumber--;

          return;
      }

      _memoryTrackingGranular.ForceDirty(mAddress, mSize);
  }
  /// <summary>
  /// Copies the entire contents of this buffer into another buffer.
  /// </summary>
  /// <param name="destination">The destination buffer to copy the data into</param>
  /// <param name="dstOffset">The offset of the destination buffer to copy into</param>
  public void CopyTo(Buffer destination, int dstOffset)
  {
      const int SrcOffset = 0;
      int byteCount = (int)Size;

      _context.Renderer.Pipeline.CopyBuffer(Handle, destination.Handle, SrcOffset, dstOffset, byteCount);
  }
  /// <summary>
  /// Flushes a range of the buffer.
  /// The range data is read back from the host buffer and written into guest memory.
  /// </summary>
  /// <param name="address">Start address of the range</param>
  /// <param name="size">Size in bytes of the range</param>
  public void Flush(ulong address, ulong size)
  {
      ulong bufferOffset = address - Address;

      ReadOnlySpan<byte> hostData = _context.Renderer.GetBufferData(Handle, (int)bufferOffset, (int)size);

      // TODO: When write tracking shaders, they will need to be aware of changes in overlapping buffers.
      _physicalMemory.WriteUntracked(address, hostData);
  }
  /// <summary>
  /// Expands an address and size region so that it starts and ends on page boundaries.
  /// </summary>
  /// <param name="address">The start address of the region</param>
  /// <param name="size">The size of the region</param>
  /// <returns>The page aligned address and size</returns>
  private static (ulong address, ulong size) PageAlign(ulong address, ulong size)
  {
      ulong mask = MemoryManager.PageMask;

      // Round the start down and the end up to a page boundary.
      ulong alignedStart = address & ~mask;
      ulong alignedEnd = (address + size + mask) & ~mask;

      return (alignedStart, alignedEnd - alignedStart);
  }
  /// <summary>
  /// Flushes modified ranges of the buffer from another thread.
  /// All modifications made before the active SyncNumber was set are flushed; this may block to wait for GPU sync.
  /// </summary>
  /// <param name="address">Address of the memory action</param>
  /// <param name="size">Size in bytes</param>
  public void ExternalFlush(ulong address, ulong size)
  {
      _context.Renderer.BackgroundContextAction(() =>
      {
          // Read the field once so the null check and the call use the same list.
          BufferModifiedRangeList rangeList = _modifiedRanges;

          if (rangeList == null)
          {
              return;
          }

          var (alignedAddress, alignedSize) = PageAlign(address, size);

          rangeList.WaitForAndGetRanges(alignedAddress, alignedSize, Flush);
      });
  }
  /// <summary>
  /// Called when part of the memory backing this buffer has been unmapped.
  /// Calls are from non-GPU threads.
  /// </summary>
  /// <param name="address">Start address of the unmapped region</param>
  /// <param name="size">Size of the unmapped region</param>
  public void Unmapped(ulong address, ulong size)
  {
      if (_modifiedRanges != null)
      {
          _modifiedRanges.Clear(address, size);
      }

      UnmappedSequence++;
  }
  /// <summary>
  /// Disposes the data of the host buffer, leaving its tracking handles alone.
  /// </summary>
  /// <remarks>
  /// Clears the modified ranges (if any), deletes the host buffer and increments <see cref="UnmappedSequence"/>.
  /// </remarks>
  public void DisposeData()
  {
      if (_modifiedRanges != null)
      {
          _modifiedRanges.Clear();
      }

      _context.Renderer.DeleteBuffer(Handle);

      UnmappedSequence++;
  }
  /// <summary>
  /// Disposes the host buffer, releasing its tracking handles first and its data afterwards.
  /// </summary>
  public void Dispose()
  {
      // Only one of the two handles exists; the other is null and is skipped.
      if (_memoryTrackingGranular != null)
      {
          _memoryTrackingGranular.Dispose();
      }

      if (_memoryTracking != null)
      {
          _memoryTracking.Dispose();
      }

      DisposeData();
  }
  426. }
  427. }