MethodCopyBuffer.cs 9.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224
  1. using Ryujinx.Common;
  2. using Ryujinx.Graphics.Gpu.State;
  3. using Ryujinx.Graphics.Texture;
  4. using System;
  5. using System.Runtime.Intrinsics;
  6. namespace Ryujinx.Graphics.Gpu.Engine
  7. {
  8. partial class Methods
  9. {
  /// <summary>
  /// Alignment, in bytes, that is divided by the pixel size to obtain the width alignment (in pixels)
  /// expected for the stride of a linear texture.
  /// </summary>
  private const int StrideAlignment = 32;

  /// <summary>
  /// Alignment, in bytes, that is divided by the pixel size to obtain the width alignment (in pixels)
  /// expected for a block linear texture.
  /// </summary>
  private const int GobAlignment = 64;

  /// <summary>
  /// Bits of the copy method argument that select how the copy is performed.
  /// The values are combined in a single argument word and tested individually, hence the flags attribute.
  /// </summary>
  [Flags]
  enum CopyFlags
  {
      /// <summary>The copy source uses a linear layout instead of block linear.</summary>
      SrcLinear = 1 << 7,

      /// <summary>The copy destination uses a linear layout instead of block linear.</summary>
      DstLinear = 1 << 8,

      /// <summary>Selects the 2D (multiple lines) copy path rather than a plain buffer copy.</summary>
      MultiLineEnable = 1 << 9,

      /// <summary>Enables component remapping as described by the copy swizzle state.</summary>
      RemapEnable = 1 << 10
  }
  /// <summary>
  /// Checks whether the region described by a copy command spans a whole texture,
  /// rather than only a sub-rectangle of it.
  /// </summary>
  /// <param name="cbp">Copy command parameters</param>
  /// <param name="tex">Texture to compare</param>
  /// <param name="linear">True if the texture is linear, false if block linear</param>
  /// <param name="bpp">Texture bytes per pixel</param>
  /// <param name="stride">Texture stride (only consulted for linear textures)</param>
  /// <returns>
  /// True if the region starts at the texture origin and the aligned copy width matches the texture
  /// (stride in pixels for linear textures; width and height for block linear textures), false otherwise
  /// </returns>
  private bool IsTextureCopyComplete(CopyBufferParams cbp, CopyBufferTexture tex, bool linear, int bpp, int stride)
  {
      // Width alignment in pixels, derived from the byte alignment that applies to the layout.
      int pixelAlignment = (linear ? StrideAlignment : GobAlignment) / bpp;

      // A region that does not start at the origin can never cover the full texture.
      if (tex.RegionX != 0 || tex.RegionY != 0)
      {
          return false;
      }

      if (linear)
      {
          // Linear textures are matched through their stride, expressed in pixels.
          return stride / bpp == BitUtils.AlignUp(cbp.XCount, pixelAlignment);
      }

      // Block linear textures must match on both dimensions.
      if (tex.Width != BitUtils.AlignUp(cbp.XCount, pixelAlignment))
      {
          return false;
      }

      return tex.Height == cbp.YCount;
  }
  /// <summary>
  /// Performs a buffer to buffer, or buffer to texture copy.
  /// </summary>
  /// <remarks>
  /// The method call argument is interpreted as a set of <see cref="CopyFlags"/>.
  /// When <see cref="CopyFlags.MultiLineEnable"/> is set, a 2D copy of XCount by YCount pixels is performed
  /// between the source and destination regions. Otherwise XCount is the size of a buffer to buffer copy,
  /// or the number of 32-bit words to clear when the remap state describes a constant fill.
  /// Nothing is done when XCount is zero.
  /// </remarks>
  /// <param name="state">Current GPU state</param>
  /// <param name="argument">Method call argument</param>
  /// <exception cref="NotSupportedException">
  /// Thrown on the 2D path when the source pixel size is not 1, 2, 4, 8, 12 or 16 bytes
  /// </exception>
  private void CopyBuffer(GpuState state, int argument)
  {
      var cbp = state.Get<CopyBufferParams>(MethodOffset.CopyBufferParams);

      var swizzle = state.Get<CopyBufferSwizzle>(MethodOffset.CopyBufferSwizzle);

      CopyFlags copyFlags = (CopyFlags)argument;

      bool srcLinear = copyFlags.HasFlag(CopyFlags.SrcLinear);
      bool dstLinear = copyFlags.HasFlag(CopyFlags.DstLinear);
      bool copy2D = copyFlags.HasFlag(CopyFlags.MultiLineEnable);
      bool remap = copyFlags.HasFlag(CopyFlags.RemapEnable);

      int size = cbp.XCount;

      if (size == 0)
      {
          return;
      }

      if (copy2D)
      {
          // Buffer to texture copy.
          // Without remap, data is handled one byte at a time.
          int srcBpp = remap ? swizzle.UnpackSrcComponentsCount() * swizzle.UnpackComponentSize() : 1;
          int dstBpp = remap ? swizzle.UnpackDstComponentsCount() * swizzle.UnpackComponentSize() : 1;

          var dst = state.Get<CopyBufferTexture>(MethodOffset.CopyBufferDstTexture);
          var src = state.Get<CopyBufferTexture>(MethodOffset.CopyBufferSrcTexture);

          var srcCalculator = new OffsetCalculator(
              src.Width,
              src.Height,
              cbp.SrcStride,
              srcLinear,
              src.MemoryLayout.UnpackGobBlocksInY(),
              src.MemoryLayout.UnpackGobBlocksInZ(),
              srcBpp);

          var dstCalculator = new OffsetCalculator(
              dst.Width,
              dst.Height,
              cbp.DstStride,
              dstLinear,
              dst.MemoryLayout.UnpackGobBlocksInY(),
              dst.MemoryLayout.UnpackGobBlocksInZ(),
              dstBpp);

          ulong srcBaseAddress = _context.MemoryManager.Translate(cbp.SrcAddress.Pack());
          ulong dstBaseAddress = _context.MemoryManager.Translate(cbp.DstAddress.Pack());

          (int srcBaseOffset, int srcSize) = srcCalculator.GetRectangleRange(src.RegionX, src.RegionY, cbp.XCount, cbp.YCount);
          (int dstBaseOffset, int dstSize) = dstCalculator.GetRectangleRange(dst.RegionX, dst.RegionY, cbp.XCount, cbp.YCount);

          ReadOnlySpan<byte> srcSpan = _context.PhysicalMemory.GetSpan(srcBaseAddress + (ulong)srcBaseOffset, srcSize, true);

          // Work on a private copy of the destination range; it is written back explicitly below.
          Span<byte> dstSpan = _context.PhysicalMemory.GetSpan(dstBaseAddress + (ulong)dstBaseOffset, dstSize).ToArray();

          bool completeSource = IsTextureCopyComplete(cbp, src, srcLinear, srcBpp, cbp.SrcStride);
          bool completeDest = IsTextureCopyComplete(cbp, dst, dstLinear, dstBpp, cbp.DstStride);

          if (completeSource && completeDest)
          {
              Image.Texture target = TextureManager.FindTexture(dst, cbp, swizzle, dstLinear);

              if (target != null)
              {
                  // A texture matching the destination was found: convert the source data to a linear
                  // layout and hand it to the texture directly instead of writing to memory.
                  ReadOnlySpan<byte> data;

                  if (srcLinear)
                  {
                      data = LayoutConverter.ConvertLinearStridedToLinear(
                          target.Info.Width,
                          target.Info.Height,
                          1,
                          1,
                          cbp.SrcStride,
                          target.Info.FormatInfo.BytesPerPixel,
                          srcSpan);
                  }
                  else
                  {
                      data = LayoutConverter.ConvertBlockLinearToLinear(
                          src.Width,
                          src.Height,
                          1,
                          target.Info.Levels,
                          1,
                          1,
                          1,
                          srcBpp,
                          src.MemoryLayout.UnpackGobBlocksInY(),
                          src.MemoryLayout.UnpackGobBlocksInZ(),
                          1,
                          new SizeInfo((int)target.Size),
                          srcSpan);
                  }

                  target.SetData(data);
                  target.SignalModified();

                  return;
              }
              else if (srcCalculator.LayoutMatches(dstCalculator))
              {
                  srcSpan.CopyTo(dstSpan); // No layout conversion has to be performed, just copy the data entirely.

                  _context.PhysicalMemory.Write(dstBaseAddress + (ulong)dstBaseOffset, dstSpan);

                  return;
              }
          }

          // Slow path: copies the region one pixel at a time, translating each coordinate through
          // the source and destination layouts. T is an unmanaged type whose size is the pixel size.
          // Always returns true; the return value only exists so the calls can be used as switch
          // expression arms.
          // NOTE(review): T is selected from srcBpp only, while destination offsets come from a
          // calculator built with dstBpp. Confirm both always match on this path, otherwise the raw
          // store below could write outside dstData.
          unsafe bool Convert<T>(Span<byte> dstData, ReadOnlySpan<byte> srcData) where T : unmanaged
          {
              fixed (byte* dstPtr = dstData, srcPtr = srcData)
              {
                  byte* dstBase = dstPtr - dstBaseOffset; // Layout offset is relative to the base, so we need to subtract the span's offset.
                  byte* srcBase = srcPtr - srcBaseOffset;

                  for (int y = 0; y < cbp.YCount; y++)
                  {
                      srcCalculator.SetY(src.RegionY + y);
                      dstCalculator.SetY(dst.RegionY + y);

                      for (int x = 0; x < cbp.XCount; x++)
                      {
                          int srcOffset = srcCalculator.GetOffset(src.RegionX + x);
                          int dstOffset = dstCalculator.GetOffset(dst.RegionX + x);

                          *(T*)(dstBase + dstOffset) = *(T*)(srcBase + srcOffset);
                      }
                  }
              }

              return true;
          }

          // Dispatch on the pixel size so each pixel is moved with a single typed load/store.
          bool _ = srcBpp switch
          {
              1 => Convert<byte>(dstSpan, srcSpan),
              2 => Convert<ushort>(dstSpan, srcSpan),
              4 => Convert<uint>(dstSpan, srcSpan),
              8 => Convert<ulong>(dstSpan, srcSpan),
              12 => Convert<Bpp12Pixel>(dstSpan, srcSpan),
              16 => Convert<Vector128<byte>>(dstSpan, srcSpan),
              _ => throw new NotSupportedException($"Unable to copy {srcBpp} bpp pixel format.")
          };

          _context.PhysicalMemory.Write(dstBaseAddress + (ulong)dstBaseOffset, dstSpan);
      }
      else
      {
          if (remap &&
              swizzle.UnpackDstX() == BufferSwizzleComponent.ConstA &&
              swizzle.UnpackDstY() == BufferSwizzleComponent.ConstA &&
              swizzle.UnpackDstZ() == BufferSwizzleComponent.ConstA &&
              swizzle.UnpackDstW() == BufferSwizzleComponent.ConstA &&
              swizzle.UnpackSrcComponentsCount() == 1 &&
              swizzle.UnpackDstComponentsCount() == 1 &&
              swizzle.UnpackComponentSize() == 4)
          {
              // Fast path for clears when remap is enabled.
              // Every destination component is the constant, so the copy is a fill with 4-byte values.
              BufferManager.ClearBuffer(cbp.DstAddress, (uint)size * 4, state.Get<uint>(MethodOffset.CopyBufferConstA));
          }
          else
          {
              // TODO: Implement remap functionality.
              // Buffer to buffer copy.
              BufferManager.CopyBuffer(cbp.SrcAddress, cbp.DstAddress, (uint)size);
          }
      }
  }
  195. }
  196. }