BufferHolder.cs 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512
  1. using Ryujinx.Graphics.GAL;
  2. using Silk.NET.Vulkan;
  3. using System;
  4. using System.Runtime.CompilerServices;
  5. using VkBuffer = Silk.NET.Vulkan.Buffer;
  6. using VkFormat = Silk.NET.Vulkan.Format;
  7. namespace Ryujinx.Graphics.Vulkan
  8. {
  9. class BufferHolder : IDisposable
  10. {
  11. private const int MaxUpdateBufferSize = 0x10000;
  12. public const AccessFlags DefaultAccessFlags =
  13. AccessFlags.IndirectCommandReadBit |
  14. AccessFlags.ShaderReadBit |
  15. AccessFlags.ShaderWriteBit |
  16. AccessFlags.TransferReadBit |
  17. AccessFlags.TransferWriteBit |
  18. AccessFlags.UniformReadBit;
  19. private readonly VulkanRenderer _gd;
  20. private readonly Device _device;
  21. private readonly MemoryAllocation _allocation;
  22. private readonly Auto<DisposableBuffer> _buffer;
  23. private readonly Auto<MemoryAllocation> _allocationAuto;
  24. private readonly ulong _bufferHandle;
  25. private CacheByRange<BufferHolder> _cachedConvertedBuffers;
  26. public int Size { get; }
  27. private IntPtr _map;
  28. private readonly MultiFenceHolder _waitable;
  29. private bool _lastAccessIsWrite;
  30. public BufferHolder(VulkanRenderer gd, Device device, VkBuffer buffer, MemoryAllocation allocation, int size)
  31. {
  32. _gd = gd;
  33. _device = device;
  34. _allocation = allocation;
  35. _allocationAuto = new Auto<MemoryAllocation>(allocation);
  36. _waitable = new MultiFenceHolder(size);
  37. _buffer = new Auto<DisposableBuffer>(new DisposableBuffer(gd.Api, device, buffer), _waitable, _allocationAuto);
  38. _bufferHandle = buffer.Handle;
  39. Size = size;
  40. _map = allocation.HostPointer;
  41. }
  42. public unsafe Auto<DisposableBufferView> CreateView(VkFormat format, int offset, int size)
  43. {
  44. var bufferViewCreateInfo = new BufferViewCreateInfo()
  45. {
  46. SType = StructureType.BufferViewCreateInfo,
  47. Buffer = new VkBuffer(_bufferHandle),
  48. Format = format,
  49. Offset = (uint)offset,
  50. Range = (uint)size
  51. };
  52. _gd.Api.CreateBufferView(_device, bufferViewCreateInfo, null, out var bufferView).ThrowOnError();
  53. return new Auto<DisposableBufferView>(new DisposableBufferView(_gd.Api, _device, bufferView), _waitable, _buffer);
  54. }
  55. public unsafe void InsertBarrier(CommandBuffer commandBuffer, bool isWrite)
  56. {
  57. // If the last access is write, we always need a barrier to be sure we will read or modify
  58. // the correct data.
  59. // If the last access is read, and current one is a write, we need to wait until the
  60. // read finishes to avoid overwriting data still in use.
  61. // Otherwise, if the last access is a read and the current one too, we don't need barriers.
  62. bool needsBarrier = isWrite || _lastAccessIsWrite;
  63. _lastAccessIsWrite = isWrite;
  64. if (needsBarrier)
  65. {
  66. MemoryBarrier memoryBarrier = new MemoryBarrier()
  67. {
  68. SType = StructureType.MemoryBarrier,
  69. SrcAccessMask = DefaultAccessFlags,
  70. DstAccessMask = DefaultAccessFlags
  71. };
  72. _gd.Api.CmdPipelineBarrier(
  73. commandBuffer,
  74. PipelineStageFlags.AllCommandsBit,
  75. PipelineStageFlags.AllCommandsBit,
  76. DependencyFlags.DeviceGroupBit,
  77. 1,
  78. memoryBarrier,
  79. 0,
  80. null,
  81. 0,
  82. null);
  83. }
  84. }
  85. public Auto<DisposableBuffer> GetBuffer()
  86. {
  87. return _buffer;
  88. }
  89. public Auto<DisposableBuffer> GetBuffer(CommandBuffer commandBuffer, bool isWrite = false)
  90. {
  91. if (isWrite)
  92. {
  93. SignalWrite(0, Size);
  94. }
  95. return _buffer;
  96. }
  97. public Auto<DisposableBuffer> GetBuffer(CommandBuffer commandBuffer, int offset, int size, bool isWrite = false)
  98. {
  99. if (isWrite)
  100. {
  101. SignalWrite(offset, size);
  102. }
  103. return _buffer;
  104. }
  105. public void SignalWrite(int offset, int size)
  106. {
  107. if (offset == 0 && size == Size)
  108. {
  109. _cachedConvertedBuffers.Clear();
  110. }
  111. else
  112. {
  113. _cachedConvertedBuffers.ClearRange(offset, size);
  114. }
  115. }
  116. public BufferHandle GetHandle()
  117. {
  118. var handle = _bufferHandle;
  119. return Unsafe.As<ulong, BufferHandle>(ref handle);
  120. }
  121. public unsafe IntPtr Map(int offset, int mappingSize)
  122. {
  123. return _map;
  124. }
  125. public unsafe ReadOnlySpan<byte> GetData(int offset, int size)
  126. {
  127. if (_map != IntPtr.Zero)
  128. {
  129. return GetDataStorage(offset, size);
  130. }
  131. else
  132. {
  133. BackgroundResource resource = _gd.BackgroundResources.Get();
  134. if (_gd.CommandBufferPool.OwnedByCurrentThread)
  135. {
  136. _gd.FlushAllCommands();
  137. return resource.GetFlushBuffer().GetBufferData(_gd.CommandBufferPool, this, offset, size);
  138. }
  139. else
  140. {
  141. return resource.GetFlushBuffer().GetBufferData(resource.GetPool(), this, offset, size);
  142. }
  143. }
  144. }
  145. public unsafe Span<byte> GetDataStorage(int offset, int size)
  146. {
  147. int mappingSize = Math.Min(size, Size - offset);
  148. if (_map != IntPtr.Zero)
  149. {
  150. return new Span<byte>((void*)(_map + offset), mappingSize);
  151. }
  152. throw new InvalidOperationException("The buffer is not host mapped.");
  153. }
  154. public unsafe void SetData(int offset, ReadOnlySpan<byte> data, CommandBufferScoped? cbs = null, Action endRenderPass = null)
  155. {
  156. int dataSize = Math.Min(data.Length, Size - offset);
  157. if (dataSize == 0)
  158. {
  159. return;
  160. }
  161. if (_map != IntPtr.Zero)
  162. {
  163. // If persistently mapped, set the data directly if the buffer is not currently in use.
  164. bool isRented = _buffer.HasRentedCommandBufferDependency(_gd.CommandBufferPool);
  165. // If the buffer is rented, take a little more time and check if the use overlaps this handle.
  166. bool needsFlush = isRented && _waitable.IsBufferRangeInUse(offset, dataSize);
  167. if (!needsFlush)
  168. {
  169. WaitForFences(offset, dataSize);
  170. data.Slice(0, dataSize).CopyTo(new Span<byte>((void*)(_map + offset), dataSize));
  171. SignalWrite(offset, dataSize);
  172. return;
  173. }
  174. }
  175. if (cbs != null &&
  176. _gd.PipelineInternal.RenderPassActive &&
  177. !(_buffer.HasCommandBufferDependency(cbs.Value) &&
  178. _waitable.IsBufferRangeInUse(cbs.Value.CommandBufferIndex, offset, dataSize)))
  179. {
  180. // If the buffer hasn't been used on the command buffer yet, try to preload the data.
  181. // This avoids ending and beginning render passes on each buffer data upload.
  182. cbs = _gd.PipelineInternal.GetPreloadCommandBuffer();
  183. endRenderPass = null;
  184. }
  185. if (cbs == null ||
  186. !VulkanConfiguration.UseFastBufferUpdates ||
  187. data.Length > MaxUpdateBufferSize ||
  188. !TryPushData(cbs.Value, endRenderPass, offset, data))
  189. {
  190. _gd.BufferManager.StagingBuffer.PushData(_gd.CommandBufferPool, cbs, endRenderPass, this, offset, data);
  191. }
  192. }
  193. public unsafe void SetDataUnchecked(int offset, ReadOnlySpan<byte> data)
  194. {
  195. int dataSize = Math.Min(data.Length, Size - offset);
  196. if (dataSize == 0)
  197. {
  198. return;
  199. }
  200. if (_map != IntPtr.Zero)
  201. {
  202. data.Slice(0, dataSize).CopyTo(new Span<byte>((void*)(_map + offset), dataSize));
  203. }
  204. else
  205. {
  206. _gd.BufferManager.StagingBuffer.PushData(_gd.CommandBufferPool, null, null, this, offset, data);
  207. }
  208. }
  209. public void SetDataInline(CommandBufferScoped cbs, Action endRenderPass, int dstOffset, ReadOnlySpan<byte> data)
  210. {
  211. if (!TryPushData(cbs, endRenderPass, dstOffset, data))
  212. {
  213. throw new ArgumentException($"Invalid offset 0x{dstOffset:X} or data size 0x{data.Length:X}.");
  214. }
  215. }
  216. private unsafe bool TryPushData(CommandBufferScoped cbs, Action endRenderPass, int dstOffset, ReadOnlySpan<byte> data)
  217. {
  218. if ((dstOffset & 3) != 0 || (data.Length & 3) != 0)
  219. {
  220. return false;
  221. }
  222. endRenderPass?.Invoke();
  223. var dstBuffer = GetBuffer(cbs.CommandBuffer, dstOffset, data.Length, true).Get(cbs, dstOffset, data.Length).Value;
  224. InsertBufferBarrier(
  225. _gd,
  226. cbs.CommandBuffer,
  227. dstBuffer,
  228. DefaultAccessFlags,
  229. AccessFlags.TransferWriteBit,
  230. PipelineStageFlags.AllCommandsBit,
  231. PipelineStageFlags.TransferBit,
  232. dstOffset,
  233. data.Length);
  234. fixed (byte* pData = data)
  235. {
  236. for (ulong offset = 0; offset < (ulong)data.Length;)
  237. {
  238. ulong size = Math.Min(MaxUpdateBufferSize, (ulong)data.Length - offset);
  239. _gd.Api.CmdUpdateBuffer(cbs.CommandBuffer, dstBuffer, (ulong)dstOffset + offset, size, pData + offset);
  240. offset += size;
  241. }
  242. }
  243. InsertBufferBarrier(
  244. _gd,
  245. cbs.CommandBuffer,
  246. dstBuffer,
  247. AccessFlags.TransferWriteBit,
  248. DefaultAccessFlags,
  249. PipelineStageFlags.TransferBit,
  250. PipelineStageFlags.AllCommandsBit,
  251. dstOffset,
  252. data.Length);
  253. return true;
  254. }
  255. public static unsafe void Copy(
  256. VulkanRenderer gd,
  257. CommandBufferScoped cbs,
  258. Auto<DisposableBuffer> src,
  259. Auto<DisposableBuffer> dst,
  260. int srcOffset,
  261. int dstOffset,
  262. int size)
  263. {
  264. var srcBuffer = src.Get(cbs, srcOffset, size).Value;
  265. var dstBuffer = dst.Get(cbs, dstOffset, size).Value;
  266. InsertBufferBarrier(
  267. gd,
  268. cbs.CommandBuffer,
  269. dstBuffer,
  270. DefaultAccessFlags,
  271. AccessFlags.TransferWriteBit,
  272. PipelineStageFlags.AllCommandsBit,
  273. PipelineStageFlags.TransferBit,
  274. dstOffset,
  275. size);
  276. var region = new BufferCopy((ulong)srcOffset, (ulong)dstOffset, (ulong)size);
  277. gd.Api.CmdCopyBuffer(cbs.CommandBuffer, srcBuffer, dstBuffer, 1, &region);
  278. InsertBufferBarrier(
  279. gd,
  280. cbs.CommandBuffer,
  281. dstBuffer,
  282. AccessFlags.TransferWriteBit,
  283. DefaultAccessFlags,
  284. PipelineStageFlags.TransferBit,
  285. PipelineStageFlags.AllCommandsBit,
  286. dstOffset,
  287. size);
  288. }
  289. public static unsafe void InsertBufferBarrier(
  290. VulkanRenderer gd,
  291. CommandBuffer commandBuffer,
  292. VkBuffer buffer,
  293. AccessFlags srcAccessMask,
  294. AccessFlags dstAccessMask,
  295. PipelineStageFlags srcStageMask,
  296. PipelineStageFlags dstStageMask,
  297. int offset,
  298. int size)
  299. {
  300. BufferMemoryBarrier memoryBarrier = new BufferMemoryBarrier()
  301. {
  302. SType = StructureType.BufferMemoryBarrier,
  303. SrcAccessMask = srcAccessMask,
  304. DstAccessMask = dstAccessMask,
  305. SrcQueueFamilyIndex = Vk.QueueFamilyIgnored,
  306. DstQueueFamilyIndex = Vk.QueueFamilyIgnored,
  307. Buffer = buffer,
  308. Offset = (ulong)offset,
  309. Size = (ulong)size
  310. };
  311. gd.Api.CmdPipelineBarrier(
  312. commandBuffer,
  313. srcStageMask,
  314. dstStageMask,
  315. 0,
  316. 0,
  317. null,
  318. 1,
  319. memoryBarrier,
  320. 0,
  321. null);
  322. }
  323. public void WaitForFences()
  324. {
  325. _waitable.WaitForFences(_gd.Api, _device);
  326. }
  327. public void WaitForFences(int offset, int size)
  328. {
  329. _waitable.WaitForFences(_gd.Api, _device, offset, size);
  330. }
  331. private bool BoundToRange(int offset, ref int size)
  332. {
  333. if (offset >= Size)
  334. {
  335. return false;
  336. }
  337. size = Math.Min(Size - offset, size);
  338. return true;
  339. }
  340. public Auto<DisposableBuffer> GetBufferI8ToI16(CommandBufferScoped cbs, int offset, int size)
  341. {
  342. if (!BoundToRange(offset, ref size))
  343. {
  344. return null;
  345. }
  346. var key = new I8ToI16CacheKey(_gd);
  347. if (!_cachedConvertedBuffers.TryGetValue(offset, size, key, out var holder))
  348. {
  349. holder = _gd.BufferManager.Create(_gd, (size * 2 + 3) & ~3);
  350. _gd.PipelineInternal.EndRenderPass();
  351. _gd.HelperShader.ConvertI8ToI16(_gd, cbs, this, holder, offset, size);
  352. key.SetBuffer(holder.GetBuffer());
  353. _cachedConvertedBuffers.Add(offset, size, key, holder);
  354. }
  355. return holder.GetBuffer();
  356. }
  357. public Auto<DisposableBuffer> GetAlignedVertexBuffer(CommandBufferScoped cbs, int offset, int size, int stride, int alignment)
  358. {
  359. if (!BoundToRange(offset, ref size))
  360. {
  361. return null;
  362. }
  363. var key = new AlignedVertexBufferCacheKey(_gd, stride, alignment);
  364. if (!_cachedConvertedBuffers.TryGetValue(offset, size, key, out var holder))
  365. {
  366. int alignedStride = (stride + (alignment - 1)) & -alignment;
  367. holder = _gd.BufferManager.Create(_gd, (size / stride) * alignedStride);
  368. _gd.PipelineInternal.EndRenderPass();
  369. _gd.HelperShader.ChangeStride(_gd, cbs, this, holder, offset, size, stride, alignedStride);
  370. key.SetBuffer(holder.GetBuffer());
  371. _cachedConvertedBuffers.Add(offset, size, key, holder);
  372. }
  373. return holder.GetBuffer();
  374. }
  375. public Auto<DisposableBuffer> GetBufferTopologyConversion(CommandBufferScoped cbs, int offset, int size, IndexBufferPattern pattern, int indexSize)
  376. {
  377. if (!BoundToRange(offset, ref size))
  378. {
  379. return null;
  380. }
  381. var key = new TopologyConversionCacheKey(_gd, pattern, indexSize);
  382. if (!_cachedConvertedBuffers.TryGetValue(offset, size, key, out var holder))
  383. {
  384. // The destination index size is always I32.
  385. int indexCount = size / indexSize;
  386. int convertedCount = pattern.GetConvertedCount(indexCount);
  387. holder = _gd.BufferManager.Create(_gd, convertedCount * 4);
  388. _gd.PipelineInternal.EndRenderPass();
  389. _gd.HelperShader.ConvertIndexBuffer(_gd, cbs, this, holder, pattern, indexSize, offset, indexCount);
  390. key.SetBuffer(holder.GetBuffer());
  391. _cachedConvertedBuffers.Add(offset, size, key, holder);
  392. }
  393. return holder.GetBuffer();
  394. }
  395. public bool TryGetCachedConvertedBuffer(int offset, int size, ICacheKey key, out BufferHolder holder)
  396. {
  397. return _cachedConvertedBuffers.TryGetValue(offset, size, key, out holder);
  398. }
  399. public void AddCachedConvertedBuffer(int offset, int size, ICacheKey key, BufferHolder holder)
  400. {
  401. _cachedConvertedBuffers.Add(offset, size, key, holder);
  402. }
  403. public void AddCachedConvertedBufferDependency(int offset, int size, ICacheKey key, Dependency dependency)
  404. {
  405. _cachedConvertedBuffers.AddDependency(offset, size, key, dependency);
  406. }
  407. public void RemoveCachedConvertedBuffer(int offset, int size, ICacheKey key)
  408. {
  409. _cachedConvertedBuffers.Remove(offset, size, key);
  410. }
  411. public void Dispose()
  412. {
  413. _gd.PipelineInternal?.FlushCommandsIfWeightExceeding(_buffer, (ulong)Size);
  414. _buffer.Dispose();
  415. _allocationAuto.Dispose();
  416. _cachedConvertedBuffers.Dispose();
  417. }
  418. }
  419. }