// VulkanRenderer.cs (35 KB)
  1. using Ryujinx.Common.Configuration;
  2. using Ryujinx.Common.Logging;
  3. using Ryujinx.Graphics.GAL;
  4. using Ryujinx.Graphics.Shader;
  5. using Ryujinx.Graphics.Shader.Translation;
  6. using Ryujinx.Graphics.Vulkan.MoltenVK;
  7. using Ryujinx.Graphics.Vulkan.Queries;
  8. using Silk.NET.Vulkan;
  9. using Silk.NET.Vulkan.Extensions.EXT;
  10. using Silk.NET.Vulkan.Extensions.KHR;
  11. using System;
  12. using System.Collections.Generic;
  13. using System.Runtime.InteropServices;
  14. using Format = Ryujinx.Graphics.GAL.Format;
  15. using PrimitiveTopology = Ryujinx.Graphics.GAL.PrimitiveTopology;
  16. using SamplerCreateInfo = Ryujinx.Graphics.GAL.SamplerCreateInfo;
  17. namespace Ryujinx.Graphics.Vulkan
  18. {
  19. public sealed class VulkanRenderer : IRenderer
  20. {
  // ---- Vulkan context objects, assigned in SetupContext ----
  private VulkanInstance _instance;
  private VulkanDebugMessenger _debugMessenger;
  private SurfaceKHR _surface;
  private VulkanPhysicalDevice _physicalDevice;
  private Device _device;
  private WindowBase _window;

  // Set at the end of SetupContext; Dispose returns immediately while this is false.
  private bool _initialized;

  // ---- Objects assigned in LoadFeatures ----
  private Counters _counters;
  private PipelineFull _pipeline;

  // ---- Values captured by the constructor ----
  private readonly Func<Instance, Vk, SurfaceKHR> _getSurface;
  private readonly Func<string[]> _getRequiredExtensions;
  private readonly string _preferredGpuId;

  // ---- Device capability snapshots, filled in by LoadFeatures ----
  internal FormatCapabilities FormatCapabilities { get; private set; }
  internal HardwareCapabilities Capabilities;

  // ---- API entry points (the extension ones stay null when the extension lookup fails) ----
  internal Vk Api { get; private set; }
  internal KhrSurface SurfaceApi { get; private set; }
  internal KhrSwapchain SwapchainApi { get; private set; }
  internal ExtConditionalRendering ConditionalRenderingApi { get; private set; }
  internal ExtExtendedDynamicState ExtendedDynamicStateApi { get; private set; }
  internal KhrPushDescriptor PushDescriptorApi { get; private set; }
  internal ExtTransformFeedback TransformFeedbackApi { get; private set; }
  internal KhrDrawIndirectCount DrawIndirectCountApi { get; private set; }

  // ---- Queues and the lock objects created alongside them ----
  internal uint QueueFamilyIndex { get; private set; }
  internal Queue Queue { get; private set; }
  internal object QueueLock { get; private set; }
  // Only assigned when the selected queue family exposes at least two queues.
  internal Queue BackgroundQueue { get; private set; }
  internal object BackgroundQueueLock { get; private set; }

  // ---- Renderer subsystems, constructed in LoadFeatures ----
  internal MemoryAllocator MemoryAllocator { get; private set; }
  internal HostMemoryAllocator HostMemoryAllocator { get; private set; }
  internal CommandBufferPool CommandBufferPool { get; private set; }
  internal DescriptorSetManager DescriptorSetManager { get; private set; }
  internal PipelineLayoutCache PipelineLayoutCache { get; private set; }
  internal BackgroundResources BackgroundResources { get; private set; }
  internal SyncManager SyncManager { get; private set; }
  internal BufferManager BufferManager { get; private set; }
  internal HelperShader HelperShader { get; private set; }

  // Stored by SetInterruptAction.
  internal Action<Action> InterruptAction { get; private set; }

  // ---- Resource sets; everything still in them is disposed/released by Dispose ----
  internal HashSet<ShaderCollection> Shaders { get; }
  internal HashSet<ITexture> Textures { get; }
  internal HashSet<SamplerHolder> Samplers { get; }

  // ---- Pipeline and window accessors ----
  internal PipelineFull PipelineInternal => _pipeline;
  public IPipeline Pipeline => _pipeline;
  public IWindow Window => _window;

  // ---- Vendor and platform flags (assigned in the constructor, LoadFeatures and PrintGpuInformation) ----
  internal Vendor Vendor { get; private set; }
  internal bool IsAmdWindows { get; private set; }
  internal bool IsIntelWindows { get; private set; }
  internal bool IsAmdGcn { get; private set; }
  internal bool IsMoltenVk { get; private set; }
  internal bool IsTBDR { get; private set; }
  internal bool IsSharedMemory { get; private set; }

  // ---- Human-readable GPU description, assigned in PrintGpuInformation ----
  public string GpuVendor { get; private set; }
  public string GpuRenderer { get; private set; }
  public string GpuVersion { get; private set; }

  public bool PreferThreading => true;

  // Raised by OnScreenCaptured.
  public event EventHandler<ScreenCaptureImageInfo> ScreenCaptured;
  /// <summary>
  /// Stores the API object and the callbacks needed later by <c>SetupContext</c>, and creates the
  /// empty resource tracking sets. No Vulkan instance or device is created here.
  /// </summary>
  /// <param name="api">Vulkan API object used for every call made by this renderer.</param>
  /// <param name="surfaceFunc">Callback invoked during setup to obtain the presentation surface.</param>
  /// <param name="requiredExtensionsFunc">Callback invoked during setup to obtain the extensions passed to instance creation.</param>
  /// <param name="preferredGpuId">Identifier forwarded to physical device selection.</param>
  public VulkanRenderer(Vk api, Func<Instance, Vk, SurfaceKHR> surfaceFunc, Func<string[]> requiredExtensionsFunc, string preferredGpuId)
  {
      Api = api;
      _preferredGpuId = preferredGpuId;
      _getRequiredExtensions = requiredExtensionsFunc;
      _getSurface = surfaceFunc;

      Samplers = new();
      Textures = new();
      Shaders = new();

      if (!OperatingSystem.IsMacOS())
      {
          return;
      }

      MVKInitialization.Initialize();

      // Any device running on MacOS is using MoltenVK, even Intel and AMD vendors.
      IsMoltenVk = true;
  }
  /// <summary>
  /// Loads the optional device extension APIs, queries device properties and features, builds
  /// <see cref="Capabilities"/> from them and then constructs the renderer subsystems.
  /// </summary>
  /// <param name="maxQueueCount">Number of queues available in the selected family; a background queue is fetched when it is at least 2.</param>
  /// <param name="queueFamilyIndex">Queue family used for the background queue and the command buffer pool.</param>
  private unsafe void LoadFeatures(uint maxQueueCount, uint queueFamilyIndex)
  {
      // Resolve the vendor before anything below reads it. The MultiViewport workaround in the
      // capabilities list compares against Vendor, but PrintGpuInformation (the other place that
      // assigns it) only runs after SetupContext, and therefore this method, has returned.
      Vendor = VendorUtils.FromId(_physicalDevice.PhysicalDeviceProperties.VendorID);

      FormatCapabilities = new FormatCapabilities(Api, _physicalDevice.PhysicalDevice);

      // Optional extension entry points; each property keeps its previous value when the lookup fails.
      if (Api.TryGetDeviceExtension(_instance.Instance, _device, out ExtConditionalRendering conditionalRenderingApi))
      {
          ConditionalRenderingApi = conditionalRenderingApi;
      }

      if (Api.TryGetDeviceExtension(_instance.Instance, _device, out ExtExtendedDynamicState extendedDynamicStateApi))
      {
          ExtendedDynamicStateApi = extendedDynamicStateApi;
      }

      if (Api.TryGetDeviceExtension(_instance.Instance, _device, out KhrPushDescriptor pushDescriptorApi))
      {
          PushDescriptorApi = pushDescriptorApi;
      }

      if (Api.TryGetDeviceExtension(_instance.Instance, _device, out ExtTransformFeedback transformFeedbackApi))
      {
          TransformFeedbackApi = transformFeedbackApi;
      }

      if (Api.TryGetDeviceExtension(_instance.Instance, _device, out KhrDrawIndirectCount drawIndirectCountApi))
      {
          DrawIndirectCountApi = drawIndirectCountApi;
      }

      // A second queue from the same family is used as the background queue when one exists.
      if (maxQueueCount >= 2)
      {
          Api.GetDeviceQueue(_device, queueFamilyIndex, 1, out var backgroundQueue);

          BackgroundQueue = backgroundQueue;
          BackgroundQueueLock = new object();
      }

      // ---- Properties chain: each struct is pushed at the head of properties2.PNext ----
      PhysicalDeviceProperties2 properties2 = new()
      {
          SType = StructureType.PhysicalDeviceProperties2,
      };

      PhysicalDeviceSubgroupProperties propertiesSubgroup = new()
      {
          SType = StructureType.PhysicalDeviceSubgroupProperties,
          PNext = properties2.PNext,
      };

      properties2.PNext = &propertiesSubgroup;

      PhysicalDeviceBlendOperationAdvancedPropertiesEXT propertiesBlendOperationAdvanced = new()
      {
          SType = StructureType.PhysicalDeviceBlendOperationAdvancedPropertiesExt,
      };

      bool supportsBlendOperationAdvanced = _physicalDevice.IsDeviceExtensionPresent("VK_EXT_blend_operation_advanced");

      if (supportsBlendOperationAdvanced)
      {
          propertiesBlendOperationAdvanced.PNext = properties2.PNext;
          properties2.PNext = &propertiesBlendOperationAdvanced;
      }

      bool supportsTransformFeedback = _physicalDevice.IsDeviceExtensionPresent(ExtTransformFeedback.ExtensionName);

      PhysicalDeviceTransformFeedbackPropertiesEXT propertiesTransformFeedback = new()
      {
          SType = StructureType.PhysicalDeviceTransformFeedbackPropertiesExt,
      };

      if (supportsTransformFeedback)
      {
          propertiesTransformFeedback.PNext = properties2.PNext;
          properties2.PNext = &propertiesTransformFeedback;
      }

      PhysicalDevicePortabilitySubsetPropertiesKHR propertiesPortabilitySubset = new()
      {
          SType = StructureType.PhysicalDevicePortabilitySubsetPropertiesKhr,
      };

      // ---- Features chain: structs are only linked in when their extension is present ----
      PhysicalDeviceFeatures2 features2 = new()
      {
          SType = StructureType.PhysicalDeviceFeatures2,
      };

      PhysicalDevicePrimitiveTopologyListRestartFeaturesEXT featuresPrimitiveTopologyListRestart = new()
      {
          SType = StructureType.PhysicalDevicePrimitiveTopologyListRestartFeaturesExt,
      };

      PhysicalDeviceRobustness2FeaturesEXT featuresRobustness2 = new()
      {
          SType = StructureType.PhysicalDeviceRobustness2FeaturesExt,
      };

      PhysicalDeviceShaderFloat16Int8FeaturesKHR featuresShaderInt8 = new()
      {
          SType = StructureType.PhysicalDeviceShaderFloat16Int8Features,
      };

      PhysicalDeviceCustomBorderColorFeaturesEXT featuresCustomBorderColor = new()
      {
          SType = StructureType.PhysicalDeviceCustomBorderColorFeaturesExt,
      };

      PhysicalDeviceDepthClipControlFeaturesEXT featuresDepthClipControl = new()
      {
          SType = StructureType.PhysicalDeviceDepthClipControlFeaturesExt,
      };

      PhysicalDevicePortabilitySubsetFeaturesKHR featuresPortabilitySubset = new()
      {
          SType = StructureType.PhysicalDevicePortabilitySubsetFeaturesKhr,
      };

      if (_physicalDevice.IsDeviceExtensionPresent("VK_EXT_primitive_topology_list_restart"))
      {
          features2.PNext = &featuresPrimitiveTopologyListRestart;
      }

      if (_physicalDevice.IsDeviceExtensionPresent("VK_EXT_robustness2"))
      {
          featuresRobustness2.PNext = features2.PNext;
          features2.PNext = &featuresRobustness2;
      }

      if (_physicalDevice.IsDeviceExtensionPresent("VK_KHR_shader_float16_int8"))
      {
          featuresShaderInt8.PNext = features2.PNext;
          features2.PNext = &featuresShaderInt8;
      }

      if (_physicalDevice.IsDeviceExtensionPresent("VK_EXT_custom_border_color"))
      {
          featuresCustomBorderColor.PNext = features2.PNext;
          features2.PNext = &featuresCustomBorderColor;
      }

      bool supportsDepthClipControl = _physicalDevice.IsDeviceExtensionPresent("VK_EXT_depth_clip_control");

      if (supportsDepthClipControl)
      {
          featuresDepthClipControl.PNext = features2.PNext;
          features2.PNext = &featuresDepthClipControl;
      }

      bool usePortability = _physicalDevice.IsDeviceExtensionPresent("VK_KHR_portability_subset");

      if (usePortability)
      {
          propertiesPortabilitySubset.PNext = properties2.PNext;
          properties2.PNext = &propertiesPortabilitySubset;

          featuresPortabilitySubset.PNext = features2.PNext;
          features2.PNext = &featuresPortabilitySubset;
      }

      // Fill both chains in one query each.
      Api.GetPhysicalDeviceProperties2(_physicalDevice.PhysicalDevice, &properties2);
      Api.GetPhysicalDeviceFeatures2(_physicalDevice.PhysicalDevice, &features2);

      // Each portability feature that is reported missing becomes a "No*" restriction flag.
      var portabilityFlags = PortabilitySubsetFlags.None;
      uint vertexBufferAlignment = 1;

      if (usePortability)
      {
          vertexBufferAlignment = propertiesPortabilitySubset.MinVertexInputBindingStrideAlignment;

          portabilityFlags |= featuresPortabilitySubset.TriangleFans ? 0 : PortabilitySubsetFlags.NoTriangleFans;
          portabilityFlags |= featuresPortabilitySubset.PointPolygons ? 0 : PortabilitySubsetFlags.NoPointMode;
          portabilityFlags |= featuresPortabilitySubset.ImageView2DOn3DImage ? 0 : PortabilitySubsetFlags.No3DImageView;
          portabilityFlags |= featuresPortabilitySubset.SamplerMipLodBias ? 0 : PortabilitySubsetFlags.NoLodBias;
      }

      bool supportsCustomBorderColor = _physicalDevice.IsDeviceExtensionPresent("VK_EXT_custom_border_color") &&
          featuresCustomBorderColor.CustomBorderColors &&
          featuresCustomBorderColor.CustomBorderColorWithoutFormat;

      ref var properties = ref properties2.Properties;

      // Largest of the storage, uniform and texel buffer offset alignments.
      ulong minResourceAlignment = Math.Max(
          Math.Max(
              properties.Limits.MinStorageBufferOffsetAlignment,
              properties.Limits.MinUniformBufferOffsetAlignment),
          properties.Limits.MinTexelBufferOffsetAlignment
      );

      // Only sample counts usable for color, depth and stencil attachments alike.
      SampleCountFlags supportedSampleCounts =
          properties.Limits.FramebufferColorSampleCounts &
          properties.Limits.FramebufferDepthSampleCounts &
          properties.Limits.FramebufferStencilSampleCounts;

      Capabilities = new HardwareCapabilities(
          _physicalDevice.IsDeviceExtensionPresent("VK_EXT_index_type_uint8"),
          supportsCustomBorderColor,
          supportsBlendOperationAdvanced,
          propertiesBlendOperationAdvanced.AdvancedBlendCorrelatedOverlap,
          propertiesBlendOperationAdvanced.AdvancedBlendNonPremultipliedSrcColor,
          propertiesBlendOperationAdvanced.AdvancedBlendNonPremultipliedDstColor,
          _physicalDevice.IsDeviceExtensionPresent(KhrDrawIndirectCount.ExtensionName),
          _physicalDevice.IsDeviceExtensionPresent("VK_EXT_fragment_shader_interlock"),
          _physicalDevice.IsDeviceExtensionPresent("VK_NV_geometry_shader_passthrough"),
          features2.Features.ShaderFloat64,
          featuresShaderInt8.ShaderInt8,
          _physicalDevice.IsDeviceExtensionPresent("VK_EXT_shader_stencil_export"),
          features2.Features.ShaderStorageImageMultisample,
          _physicalDevice.IsDeviceExtensionPresent(ExtConditionalRendering.ExtensionName),
          _physicalDevice.IsDeviceExtensionPresent(ExtExtendedDynamicState.ExtensionName),
          features2.Features.MultiViewport && !(IsMoltenVk && Vendor == Vendor.Amd), // Workaround for AMD on MoltenVK issue
          featuresRobustness2.NullDescriptor || IsMoltenVk,
          _physicalDevice.IsDeviceExtensionPresent(KhrPushDescriptor.ExtensionName),
          featuresPrimitiveTopologyListRestart.PrimitiveTopologyListRestart,
          featuresPrimitiveTopologyListRestart.PrimitiveTopologyPatchListRestart,
          supportsTransformFeedback,
          propertiesTransformFeedback.TransformFeedbackQueries,
          features2.Features.OcclusionQueryPrecise,
          _physicalDevice.PhysicalDeviceFeatures.PipelineStatisticsQuery,
          _physicalDevice.PhysicalDeviceFeatures.GeometryShader,
          _physicalDevice.PhysicalDeviceFeatures.TessellationShader,
          _physicalDevice.IsDeviceExtensionPresent("VK_NV_viewport_array2"),
          _physicalDevice.IsDeviceExtensionPresent(ExtExternalMemoryHost.ExtensionName),
          supportsDepthClipControl && featuresDepthClipControl.DepthClipControl,
          propertiesSubgroup.SubgroupSize,
          supportedSampleCounts,
          portabilityFlags,
          vertexBufferAlignment,
          properties.Limits.SubTexelPrecisionBits,
          minResourceAlignment);

      IsSharedMemory = MemoryAllocator.IsDeviceMemoryShared(_physicalDevice);

      MemoryAllocator = new MemoryAllocator(Api, _physicalDevice, _device);

      // The result of the lookup is not checked; hostMemoryApi is passed on as returned.
      Api.TryGetDeviceExtension(_instance.Instance, _device, out ExtExternalMemoryHost hostMemoryApi);
      HostMemoryAllocator = new HostMemoryAllocator(MemoryAllocator, Api, hostMemoryApi, _device);

      CommandBufferPool = new CommandBufferPool(Api, _device, Queue, QueueLock, queueFamilyIndex);

      DescriptorSetManager = new DescriptorSetManager(_device, PipelineBase.DescriptorSetLayouts);

      PipelineLayoutCache = new PipelineLayoutCache();

      BackgroundResources = new BackgroundResources(this, _device);

      BufferManager = new BufferManager(this, _device);

      SyncManager = new SyncManager(this, _device);
      _pipeline = new PipelineFull(this, _device);
      _pipeline.Initialize();

      HelperShader = new HelperShader(this, _device);

      _counters = new Counters(this, _device, _pipeline);
  }
  /// <summary>
  /// Creates the Vulkan instance, debug messenger, surface, physical/logical device, main queue
  /// and window, and calls <c>LoadFeatures</c> to build everything that depends on the device.
  /// Marks the renderer as initialized when done.
  /// </summary>
  /// <param name="logLevel">Debug level forwarded to instance creation and the debug messenger.</param>
  private void SetupContext(GraphicsDebugLevel logLevel)
  {
      _instance = VulkanInitialization.CreateInstance(Api, logLevel, _getRequiredExtensions());
      _debugMessenger = new VulkanDebugMessenger(Api, _instance.Instance, logLevel);

      if (Api.TryGetInstanceExtension(_instance.Instance, out KhrSurface surfaceApi))
      {
          SurfaceApi = surfaceApi;
      }

      _surface = _getSurface(_instance.Instance, Api);
      _physicalDevice = VulkanInitialization.FindSuitablePhysicalDevice(Api, _instance, _surface, _preferredGpuId);

      var queueFamilyIndex = VulkanInitialization.FindSuitableQueueFamily(Api, _physicalDevice, _surface, out uint maxQueueCount);

      // Publish the selected family. The property has a private setter and was previously never
      // assigned, so it always read 0 regardless of which family was actually chosen.
      QueueFamilyIndex = queueFamilyIndex;

      _device = VulkanInitialization.CreateDevice(Api, _physicalDevice, queueFamilyIndex, maxQueueCount);

      if (Api.TryGetDeviceExtension(_instance.Instance, _device, out KhrSwapchain swapchainApi))
      {
          SwapchainApi = swapchainApi;
      }

      // Queue 0 of the selected family is the main queue.
      Api.GetDeviceQueue(_device, queueFamilyIndex, 0, out var queue);
      Queue = queue;
      QueueLock = new object();

      LoadFeatures(maxQueueCount, queueFamilyIndex);

      _window = new Window(this, _surface, _physicalDevice.PhysicalDevice, _device);

      _initialized = true;
  }
  /// <summary>Creates a buffer of <paramref name="size"/> bytes through the buffer manager.</summary>
  /// <param name="size">Requested size in bytes.</param>
  /// <param name="access">Access flags; converted to an allocation type, with a separate flag passed when it equals <c>BufferAccess.Stream</c>.</param>
  /// <returns>Handle of the new buffer.</returns>
  public BufferHandle CreateBuffer(int size, BufferAccess access)
  {
      bool isStream = access == BufferAccess.Stream;

      return BufferManager.CreateWithHandle(this, size, access.Convert(), default, isStream);
  }

  /// <summary>Creates a buffer with automatic allocation type, passing another buffer as a storage hint.</summary>
  /// <param name="size">Requested size in bytes.</param>
  /// <param name="storageHint">Handle forwarded to the buffer manager as the storage hint.</param>
  /// <returns>Handle of the new buffer.</returns>
  public BufferHandle CreateBuffer(int size, BufferHandle storageHint)
      => BufferManager.CreateWithHandle(this, size, BufferAllocationType.Auto, storageHint);

  /// <summary>Creates a buffer from a host pointer through the buffer manager's host import path.</summary>
  /// <param name="pointer">Host address forwarded to the buffer manager.</param>
  /// <param name="size">Size in bytes.</param>
  /// <returns>Handle of the new buffer.</returns>
  public BufferHandle CreateBuffer(nint pointer, int size)
      => BufferManager.CreateHostImported(this, pointer, size);
  /// <summary>
  /// Creates a shader program from the given sources.
  /// </summary>
  /// <param name="sources">Shader sources, one per stage.</param>
  /// <param name="info">Resource layout, optional pipeline state and cache origin of the program.</param>
  /// <returns>
  /// A <c>ShaderCollection</c>. The state-taking constructor is used when <paramref name="info"/> carries
  /// a state or the program is a single compute stage; otherwise the layout-only constructor is used.
  /// </returns>
  public IProgram CreateProgram(ShaderSource[] sources, ShaderInfo info)
  {
      bool singleComputeStage = sources.Length == 1 && sources[0].Stage == ShaderStage.Compute;
      bool useStateConstructor = info.State.HasValue || singleComputeStage;

      if (!useStateConstructor)
      {
          return new ShaderCollection(this, _device, sources, info.ResourceLayout);
      }

      return new ShaderCollection(this, _device, sources, info.ResourceLayout, info.State ?? default, info.FromCache);
  }
  /// <summary>Creates a <c>ShaderCollection</c> with the <c>isMinimal</c> option enabled.</summary>
  /// <param name="sources">Shader sources, one per stage.</param>
  /// <param name="resourceLayout">Resource layout of the program.</param>
  /// <param name="specDescription">Optional specialization descriptions; null when omitted.</param>
  /// <returns>The new shader collection.</returns>
  internal ShaderCollection CreateProgramWithMinimalLayout(ShaderSource[] sources, ResourceLayout resourceLayout, SpecDescription[] specDescription = null)
      => new ShaderCollection(this, _device, sources, resourceLayout, specDescription, isMinimal: true);
  /// <summary>Creates a sampler for this renderer's device.</summary>
  /// <param name="info">Sampler creation parameters.</param>
  /// <returns>A new <c>SamplerHolder</c>.</returns>
  public ISampler CreateSampler(SamplerCreateInfo info) => new SamplerHolder(this, _device, info);
  /// <summary>Creates a texture; buffer targets get a <c>TextureBuffer</c>, everything else a view over new storage.</summary>
  /// <param name="info">Texture creation parameters.</param>
  /// <returns>The new texture.</returns>
  public ITexture CreateTexture(TextureCreateInfo info)
  {
      if (info.Target != Target.TextureBuffer)
      {
          return CreateTextureView(info);
      }

      return new TextureBuffer(this, info);
  }
  /// <summary>Creates new texture storage and returns a view of it created with offsets (0, 0).</summary>
  /// <param name="info">Texture creation parameters, used for both the storage and the view.</param>
  /// <returns>The view over the new storage.</returns>
  internal TextureView CreateTextureView(TextureCreateInfo info)
  {
      // The storage should be disposed when all of its views are destroyed.
      return CreateTextureStorage(info).CreateView(info, 0, 0);
  }
  /// <summary>Creates texture storage for this renderer's device.</summary>
  /// <param name="info">Texture creation parameters.</param>
  /// <returns>The new storage.</returns>
  internal TextureStorage CreateTextureStorage(TextureCreateInfo info) => new TextureStorage(this, _device, info);
  /// <summary>Deletes a buffer through the buffer manager.</summary>
  /// <param name="buffer">Handle of the buffer to delete.</param>
  public void DeleteBuffer(BufferHandle buffer) => BufferManager.Delete(buffer);
  /// <summary>Flushes the pipeline's commands; does nothing when the pipeline has not been created yet.</summary>
  internal void FlushAllCommands() => _pipeline?.FlushCommandsImpl();
  /// <summary>Notifies the sync manager of a flush, then frees completed staging buffer regions.</summary>
  internal void RegisterFlush()
  {
      SyncManager.RegisterFlush();

      // Free unused staging regions a little at a time here, rather than all at once later.
      var stagingBuffer = BufferManager.StagingBuffer;
      stagingBuffer.FreeCompleted();
  }
  /// <summary>Reads a range of a buffer through the buffer manager.</summary>
  /// <param name="buffer">Handle of the buffer to read.</param>
  /// <param name="offset">Start offset of the range.</param>
  /// <param name="size">Size of the range.</param>
  /// <returns>The data returned by the buffer manager.</returns>
  public PinnedSpan<byte> GetBufferData(BufferHandle buffer, int offset, int size)
      => BufferManager.GetData(buffer, offset, size);
  /// <summary>
  /// Builds the capability description of this renderer from format support probes, a fresh
  /// device feature query, the physical device limits and the values stored in
  /// <see cref="Capabilities"/>.
  /// </summary>
  /// <returns>The capability set for the Vulkan backend.</returns>
  public unsafe Capabilities GetCapabilities()
  {
      // Feature bits every probed format group must support.
      FormatFeatureFlags requiredFormatFeatures =
          FormatFeatureFlags.SampledImageBit |
          FormatFeatureFlags.SampledImageFilterLinearBit |
          FormatFeatureFlags.BlitSrcBit |
          FormatFeatureFlags.TransferSrcBit |
          FormatFeatureFlags.TransferDstBit;

      bool hasBc123 = FormatCapabilities.OptimalFormatsSupport(requiredFormatFeatures,
          Format.Bc1RgbaSrgb,
          Format.Bc1RgbaUnorm,
          Format.Bc2Srgb,
          Format.Bc2Unorm,
          Format.Bc3Srgb,
          Format.Bc3Unorm);

      bool hasBc45 = FormatCapabilities.OptimalFormatsSupport(requiredFormatFeatures,
          Format.Bc4Snorm,
          Format.Bc4Unorm,
          Format.Bc5Snorm,
          Format.Bc5Unorm);

      bool hasBc67 = FormatCapabilities.OptimalFormatsSupport(requiredFormatFeatures,
          Format.Bc6HSfloat,
          Format.Bc6HUfloat,
          Format.Bc7Srgb,
          Format.Bc7Unorm);

      bool hasEtc2 = FormatCapabilities.OptimalFormatsSupport(requiredFormatFeatures,
          Format.Etc2RgbaSrgb,
          Format.Etc2RgbaUnorm,
          Format.Etc2RgbPtaSrgb,
          Format.Etc2RgbPtaUnorm,
          Format.Etc2RgbSrgb,
          Format.Etc2RgbUnorm);

      bool has5BitComponents = FormatCapabilities.OptimalFormatsSupport(requiredFormatFeatures,
          Format.R5G6B5Unorm,
          Format.R5G5B5A1Unorm,
          Format.R5G5B5X1Unorm,
          Format.B5G6R5Unorm,
          Format.B5G5R5A1Unorm,
          Format.A1B5G5R5Unorm);

      bool hasR4G4B4A4 = FormatCapabilities.OptimalFormatsSupport(requiredFormatFeatures,
          Format.R4G4B4A4Unorm);

      bool hasAstcFormats = FormatCapabilities.OptimalFormatsSupport(requiredFormatFeatures,
          Format.Astc4x4Unorm,
          Format.Astc5x4Unorm,
          Format.Astc5x5Unorm,
          Format.Astc6x5Unorm,
          Format.Astc6x6Unorm,
          Format.Astc8x5Unorm,
          Format.Astc8x6Unorm,
          Format.Astc8x8Unorm,
          Format.Astc10x5Unorm,
          Format.Astc10x6Unorm,
          Format.Astc10x8Unorm,
          Format.Astc10x10Unorm,
          Format.Astc12x10Unorm,
          Format.Astc12x12Unorm,
          Format.Astc4x4Srgb,
          Format.Astc5x4Srgb,
          Format.Astc5x5Srgb,
          Format.Astc6x5Srgb,
          Format.Astc6x6Srgb,
          Format.Astc8x5Srgb,
          Format.Astc8x6Srgb,
          Format.Astc8x8Srgb,
          Format.Astc10x5Srgb,
          Format.Astc10x6Srgb,
          Format.Astc10x8Srgb,
          Format.Astc10x10Srgb,
          Format.Astc12x10Srgb,
          Format.Astc12x12Srgb);

      // Query the core features with the Vulkan 1.2 feature struct chained behind them.
      PhysicalDeviceVulkan12Features vulkan12Features = new()
      {
          SType = StructureType.PhysicalDeviceVulkan12Features,
      };

      PhysicalDeviceFeatures2 deviceFeatures = new()
      {
          SType = StructureType.PhysicalDeviceFeatures2,
          PNext = &vulkan12Features,
      };

      Api.GetPhysicalDeviceFeatures2(_physicalDevice.PhysicalDevice, &deviceFeatures);

      var deviceLimits = _physicalDevice.PhysicalDeviceProperties.Limits;

      // A non-zero gather bias precision is only reported for Intel and AMD on Windows.
      int gatherBias = (IsIntelWindows || IsAmdWindows) ? (int)Capabilities.SubTexelPrecisionBits : 0;

      return new Capabilities(
          api: TargetApi.Vulkan,
          GpuVendor,
          hasFrontFacingBug: IsIntelWindows,
          hasVectorIndexingBug: Vendor == Vendor.Qualcomm,
          needsFragmentOutputSpecialization: IsMoltenVk,
          reduceShaderPrecision: IsMoltenVk,
          supportsAstcCompression: deviceFeatures.Features.TextureCompressionAstcLdr && hasAstcFormats,
          supportsBc123Compression: hasBc123,
          supportsBc45Compression: hasBc45,
          supportsBc67Compression: hasBc67,
          supportsEtc2Compression: hasEtc2,
          supports3DTextureCompression: true,
          supportsBgraFormat: true,
          supportsR4G4Format: false,
          supportsR4G4B4A4Format: hasR4G4B4A4,
          supportsSnormBufferTextureFormat: true,
          supports5BitComponentFormat: has5BitComponents,
          supportsBlendEquationAdvanced: Capabilities.SupportsBlendEquationAdvanced,
          supportsFragmentShaderInterlock: Capabilities.SupportsFragmentShaderInterlock,
          supportsFragmentShaderOrderingIntel: false,
          supportsGeometryShader: Capabilities.SupportsGeometryShader,
          supportsGeometryShaderPassthrough: Capabilities.SupportsGeometryShaderPassthrough,
          supportsTransformFeedback: Capabilities.SupportsTransformFeedback,
          supportsImageLoadFormatted: deviceFeatures.Features.ShaderStorageImageReadWithoutFormat,
          supportsLayerVertexTessellation: vulkan12Features.ShaderOutputLayer,
          supportsMismatchingViewFormat: true,
          supportsCubemapView: !IsAmdGcn,
          supportsNonConstantTextureOffset: false,
          supportsScaledVertexFormats: FormatCapabilities.SupportsScaledVertexFormats(),
          supportsShaderBallot: false,
          supportsShaderBarrierDivergence: Vendor != Vendor.Intel,
          supportsShaderFloat64: Capabilities.SupportsShaderFloat64,
          supportsTextureShadowLod: false,
          supportsVertexStoreAndAtomics: deviceFeatures.Features.VertexPipelineStoresAndAtomics,
          supportsViewportIndexVertexTessellation: vulkan12Features.ShaderOutputViewportIndex,
          supportsViewportMask: Capabilities.SupportsViewportArray2,
          supportsViewportSwizzle: false,
          supportsIndirectParameters: true,
          supportsDepthClipControl: Capabilities.SupportsDepthClipControl,
          maximumUniformBuffersPerStage: Constants.MaxUniformBuffersPerStage,
          maximumStorageBuffersPerStage: Constants.MaxStorageBuffersPerStage,
          maximumTexturesPerStage: Constants.MaxTexturesPerStage,
          maximumImagesPerStage: Constants.MaxImagesPerStage,
          maximumComputeSharedMemorySize: (int)deviceLimits.MaxComputeSharedMemorySize,
          maximumSupportedAnisotropy: (int)deviceLimits.MaxSamplerAnisotropy,
          shaderSubgroupSize: (int)Capabilities.SubgroupSize,
          storageBufferOffsetAlignment: (int)deviceLimits.MinStorageBufferOffsetAlignment,
          textureBufferOffsetAlignment: (int)deviceLimits.MinTexelBufferOffsetAlignment,
          gatherBiasPrecision: gatherBias);
  }
  /// <summary>Returns the GPU vendor and renderer strings wrapped in a <c>HardwareInfo</c>.</summary>
  public HardwareInfo GetHardwareInfo() => new HardwareInfo(GpuVendor, GpuRenderer);
  /// <summary>
  /// Lists the suitable Vulkan devices, using the default API object
  /// returned by <see cref="Vk.GetApi()"/>.
  /// </summary>
  /// <returns>The suitable devices, or an empty array when the query throws (the error is logged).</returns>
  public static DeviceInfo[] GetPhysicalDevices()
  {
      DeviceInfo[] devices;

      try
      {
          devices = VulkanInitialization.GetSuitablePhysicalDevices(Vk.GetApi());
      }
      catch (Exception ex)
      {
          Logger.Error?.PrintMsg(LogClass.Gpu, $"Error querying Vulkan devices: {ex.Message}");

          devices = Array.Empty<DeviceInfo>();
      }

      return devices;
  }
  /// <summary>
  /// Lists the suitable Vulkan devices using the supplied API object.
  /// </summary>
  /// <param name="api">Vulkan API object used for the query.</param>
  /// <returns>The suitable devices, or an empty array when the query throws (the error is logged).</returns>
  public static DeviceInfo[] GetPhysicalDevices(Vk api)
  {
      try
      {
          return VulkanInitialization.GetSuitablePhysicalDevices(api);
      }
      catch (Exception ex)
      {
          // If we got an exception here, Vulkan is most likely not supported.
          // Log it like the parameterless overload does, so the failure is not lost silently.
          Logger.Error?.PrintMsg(LogClass.Gpu, $"Error querying Vulkan devices: {ex.Message}");

          return Array.Empty<DeviceInfo>();
      }
  }
  /// <summary>
  /// Formats a packed version number as "major.minor.patch".
  /// </summary>
  /// <param name="version">Packed value: patch in bits 0-11, minor in bits 12-21, major in everything from bit 22 up.</param>
  /// <returns>The dotted version string.</returns>
  private static string ParseStandardVulkanVersion(uint version)
  {
      uint major = version >> 22;
      uint minor = (version >> 12) & 0x3FF;
      uint patch = version & 0xFFF;

      return $"{major}.{minor}.{patch}";
  }
  /// <summary>
  /// Formats the driver version of a device as a dotted string.
  /// </summary>
  /// <param name="properties">Device properties; only <c>VendorID</c> and <c>DriverVersion</c> are read.</param>
  /// <returns>
  /// A four-part string for vendor ID 0x10DE (NVIDIA), otherwise the standard
  /// "major.minor.patch" form.
  /// </returns>
  private static string ParseDriverVersion(ref PhysicalDeviceProperties properties)
  {
      const uint NvidiaVendorId = 0x10DE;

      uint raw = properties.DriverVersion;

      if (properties.VendorID != NvidiaVendorId)
      {
          return ParseStandardVulkanVersion(raw);
      }

      // NVIDIA differs from the standard here and packs four fields: 10, 8, 8 and 6 bits wide.
      uint major = (raw >> 22) & 0x3FF;
      uint minor = (raw >> 14) & 0xFF;
      uint patch = (raw >> 6) & 0xFF;
      uint build = raw & 0x3F;

      return $"{major}.{minor}.{patch}.{build}";
  }
  /// <summary>
  /// Derives the vendor flags and the GPU description strings from the physical device
  /// properties, then logs a one-line summary.
  /// </summary>
  private unsafe void PrintGpuInformation()
  {
      // Local copy: it is passed by ref below and its fixed DeviceName buffer is read through a pointer.
      var deviceProperties = _physicalDevice.PhysicalDeviceProperties;

      GpuVendor = VendorUtils.GetNameFromId(deviceProperties.VendorID);

      Vendor vendor = VendorUtils.FromId(deviceProperties.VendorID);
      bool onWindows = OperatingSystem.IsWindows();

      Vendor = vendor;
      IsAmdWindows = vendor == Vendor.Amd && onWindows;
      IsIntelWindows = vendor == Vendor.Intel && onWindows;

      IsTBDR = vendor is Vendor.Apple
          or Vendor.Qualcomm
          or Vendor.ARM
          or Vendor.Broadcom
          or Vendor.ImgTec;

      GpuRenderer = Marshal.PtrToStringAnsi((IntPtr)deviceProperties.DeviceName);

      string apiVersion = ParseStandardVulkanVersion(deviceProperties.ApiVersion);
      string driverVersion = ParseDriverVersion(ref deviceProperties);
      GpuVersion = $"Vulkan v{apiVersion}, Driver v{driverVersion}";

      // The GCN flag is never set under MoltenVK; otherwise it depends on the renderer name matching.
      IsAmdGcn = !IsMoltenVk && vendor == Vendor.Amd && VendorUtils.AmdGcnRegex().IsMatch(GpuRenderer);

      Logger.Notice.Print(LogClass.Gpu, $"{GpuVendor} {GpuRenderer} ({GpuVersion})");
  }
  /// <summary>
  /// Maps a topology to the one used in its place: quads become triangles, quad strips become
  /// triangle strips, and triangle fans become triangles when the portability subset reports
  /// no triangle fan support. Every other topology is returned unchanged.
  /// </summary>
  /// <param name="topology">Requested topology.</param>
  /// <returns>The replacement topology.</returns>
  internal PrimitiveTopology TopologyRemap(PrimitiveTopology topology)
  {
      if (topology == PrimitiveTopology.Quads)
      {
          return PrimitiveTopology.Triangles;
      }

      if (topology == PrimitiveTopology.QuadStrip)
      {
          return PrimitiveTopology.TriangleStrip;
      }

      if (topology == PrimitiveTopology.TriangleFan &&
          Capabilities.PortabilitySubset.HasFlag(PortabilitySubsetFlags.NoTriangleFans))
      {
          return PrimitiveTopology.Triangles;
      }

      return topology;
  }
  /// <summary>
  /// Tells whether a topology is treated as unsupported: always for quads, and for triangle
  /// fans when the portability subset reports no triangle fan support.
  /// </summary>
  /// <param name="topology">Topology to check.</param>
  /// <returns>True when the topology is unsupported.</returns>
  internal bool TopologyUnsupported(PrimitiveTopology topology)
  {
      if (topology == PrimitiveTopology.Quads)
      {
          return true;
      }

      return topology == PrimitiveTopology.TriangleFan &&
          Capabilities.PortabilitySubset.HasFlag(PortabilitySubsetFlags.NoTriangleFans);
  }
  /// <summary>Sets up the Vulkan context, then derives and logs the GPU information.</summary>
  /// <param name="logLevel">Debug level forwarded to context setup.</param>
  public void Initialize(GraphicsDebugLevel logLevel)
  {
      // Context first: the GPU information is read from the physical device selected during setup.
      SetupContext(logLevel);

      PrintGpuInformation();
  }
  /// <summary>
  /// Decides whether vertex buffer strides must be aligned and to what value.
  /// </summary>
  /// <param name="attrScalarAlignment">Alignment of the largest scalar element among the attributes.</param>
  /// <param name="alignment">
  /// The device's vertex buffer alignment when that is greater than 1, otherwise
  /// <paramref name="attrScalarAlignment"/> on non-NVIDIA vendors, otherwise 1.
  /// </param>
  /// <returns>False only for NVIDIA devices whose vertex buffer alignment is not greater than 1.</returns>
  internal bool NeedsVertexBufferAlignment(int attrScalarAlignment, out int alignment)
  {
      var deviceAlignment = Capabilities.VertexBufferAlignment;

      if (deviceAlignment > 1)
      {
          alignment = (int)deviceAlignment;

          return true;
      }

      if (Vendor == Vendor.Nvidia)
      {
          alignment = 1;

          return false;
      }

      // Vulkan requires vertex attributes to be globally aligned by their component size, so
      // strides that are not a multiple of the largest scalar element are invalid. Guest
      // applications use such strides anyway; NVIDIA GPUs tolerate them, others do not.
      alignment = attrScalarAlignment;

      return true;
  }
  /// <summary>Runs the sync manager's cleanup.</summary>
  public void PreFrame() => SyncManager.Cleanup();
  /// <summary>Queues a report of the given counter.</summary>
  /// <param name="type">Counter to report.</param>
  /// <param name="resultHandler">Handler forwarded to the counter queue.</param>
  /// <param name="divisor">Divisor forwarded to the counter queue.</param>
  /// <param name="hostReserved">Flag forwarded to the counter queue.</param>
  /// <returns>The event returned by the counter queue.</returns>
  public ICounterEvent ReportCounter(CounterType type, EventHandler<ulong> resultHandler, float divisor, bool hostReserved)
      => _counters.QueueReport(type, resultHandler, divisor, hostReserved);

  /// <summary>Queues a reset of the given counter.</summary>
  /// <param name="type">Counter to reset.</param>
  public void ResetCounter(CounterType type) => _counters.QueueReset(type);
  /// <summary>Writes data into a buffer through the buffer manager.</summary>
  /// <param name="buffer">Handle of the destination buffer.</param>
  /// <param name="offset">Destination offset.</param>
  /// <param name="data">Bytes to write.</param>
  public void SetBufferData(BufferHandle buffer, int offset, ReadOnlySpan<byte> data)
      => BufferManager.SetData(buffer, offset, data, _pipeline.CurrentCommandBuffer, _pipeline.EndRenderPass);
  /// <summary>Updates the counters.</summary>
  public void UpdateCounters() => _counters.Update();

  /// <summary>Resets the counter pool.</summary>
  public void ResetCounterPool() => _counters.ResetCounterPool();

  /// <summary>Resets future counters on the given command buffer; does nothing when the counters have not been created yet.</summary>
  /// <param name="cmd">Command buffer forwarded to the counters.</param>
  /// <param name="count">Count forwarded to the counters.</param>
  public void ResetFutureCounters(CommandBuffer cmd, int count) => _counters?.ResetFutureCounters(cmd, count);
  /// <summary>Invokes <paramref name="action"/> immediately on the calling thread.</summary>
  /// <param name="action">Action to run.</param>
  /// <param name="alwaysBackground">Not used by this implementation.</param>
  public void BackgroundContextAction(Action action, bool alwaysBackground = false) => action();
  /// <summary>Creates a sync object through the sync manager.</summary>
  /// <param name="id">Identifier of the sync object.</param>
  /// <param name="strict">Flag forwarded to the sync manager.</param>
  public void CreateSync(ulong id, bool strict) => SyncManager.Create(id, strict);
  /// <summary>Not implemented by this renderer.</summary>
  /// <exception cref="NotImplementedException">Always thrown.</exception>
  public IProgram LoadProgramBinary(byte[] programBinary, bool isFragment, ShaderInfo info)
      => throw new NotImplementedException();
  /// <summary>Waits on a sync object through the sync manager.</summary>
  /// <param name="id">Identifier of the sync object.</param>
  public void WaitSync(ulong id) => SyncManager.Wait(id);

  /// <summary>Returns the sync manager's current sync value.</summary>
  public ulong GetCurrentSync() => SyncManager.GetCurrent();
  /// <summary>Stores the interrupt action in <see cref="InterruptAction"/>.</summary>
  /// <param name="interruptAction">Action to store.</param>
  public void SetInterruptAction(Action<Action> interruptAction) => InterruptAction = interruptAction;
  /// <summary>Sets the window's screen capture request flag.</summary>
  public void Screenshot() => _window.ScreenCaptureRequested = true;

  /// <summary>Raises <see cref="ScreenCaptured"/> with the captured image, if anyone is subscribed.</summary>
  /// <param name="bitmap">Captured image information passed to subscribers.</param>
  public void OnScreenCaptured(ScreenCaptureImageInfo bitmap)
  {
      EventHandler<ScreenCaptureImageInfo> subscribers = ScreenCaptured;

      if (subscribers != null)
      {
          subscribers(this, bitmap);
      }
  }
  /// <summary>
  /// Tears down the renderer: subsystems first, then the tracked shaders, textures and samplers,
  /// then the surface, device, debug messenger and finally the instance.
  /// Does nothing when the renderer was never initialized or has already been disposed.
  /// </summary>
  public unsafe void Dispose()
  {
      if (!_initialized)
      {
          return;
      }

      // Clear the flag before tearing anything down so a repeated call is a no-op instead of
      // destroying the device, surface and instance a second time.
      _initialized = false;

      CommandBufferPool.Dispose();
      BackgroundResources.Dispose();
      _counters.Dispose();
      _window.Dispose();
      HelperShader.Dispose();
      _pipeline.Dispose();
      BufferManager.Dispose();
      DescriptorSetManager.Dispose();
      PipelineLayoutCache.Dispose();

      MemoryAllocator.Dispose();

      foreach (var shader in Shaders)
      {
          shader.Dispose();
      }

      foreach (var texture in Textures)
      {
          texture.Release();
      }

      foreach (var sampler in Samplers)
      {
          sampler.Dispose();
      }

      SurfaceApi.DestroySurface(_instance.Instance, _surface, null);

      Api.DestroyDevice(_device, null);

      _debugMessenger.Dispose();

      // Last step destroy the instance
      _instance.Dispose();
  }
  /// <summary>
  /// Tries to import a host memory range through the host memory allocator.
  /// </summary>
  /// <param name="address">Start address of the host range.</param>
  /// <param name="size">Size of the host range.</param>
  /// <returns>False when host imported memory is not supported; otherwise the result of the import attempt.</returns>
  public bool PrepareHostMapping(nint address, ulong size)
  {
      if (!Capabilities.SupportsHostImportedMemory)
      {
          return false;
      }

      return HostMemoryAllocator.TryImport(
          BufferManager.HostImportedBufferMemoryRequirements,
          BufferManager.DefaultBufferMemoryFlags,
          address,
          size);
  }
  720. }
  721. }