InstEmitTexture.cs 43 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399
  1. using Ryujinx.Graphics.Shader.Decoders;
  2. using Ryujinx.Graphics.Shader.IntermediateRepresentation;
  3. using Ryujinx.Graphics.Shader.Translation;
  4. using System;
  5. using System.Collections.Generic;
  6. using static Ryujinx.Graphics.Shader.Instructions.InstEmitHelper;
  7. using static Ryujinx.Graphics.Shader.IntermediateRepresentation.OperandHelper;
  8. namespace Ryujinx.Graphics.Shader.Instructions
  9. {
  10. static partial class InstEmit
  11. {
  /// <summary>
  /// Emits the IR for an image load: one <see cref="Instruction.ImageLoad"/> texture operation
  /// is added per destination register that is written.
  /// </summary>
  /// <param name="context">Emitter context that provides the current opcode and receives the generated operations</param>
  public static void Suld(EmitterContext context)
  {
      OpCodeImage op = (OpCodeImage)context.CurrOp;

      SamplerType type = ConvertSamplerType(op.Dimensions);

      if (type == SamplerType.None)
      {
          // This method emits ImageLoad operations, so the diagnostic must mention a load, not a store.
          context.Config.GpuAccessor.Log("Invalid image load sampler type.");

          return;
      }

      // Rb is Rd on the SULD instruction.
      int rdIndex = op.Rb.Index;
      int raIndex = op.Ra.Index;

      // Returns a copy of the next register of the Ra sequence and advances the index.
      // Once the index is above RegisterZeroIndex, a constant zero is returned instead.
      Operand Ra()
      {
          if (raIndex > RegisterConsts.RegisterZeroIndex)
          {
              return Const(0);
          }

          return context.Copy(Register(raIndex++, RegisterType.Gpr));
      }

      bool isArray = op.Dimensions == ImageDimensions.Image1DArray ||
                     op.Dimensions == ImageDimensions.Image2DArray;

      // The array index is read before the coordinates, but appended after them below.
      Operand arrayIndex = isArray ? Ra() : null;

      List<Operand> sourcesList = new List<Operand>();

      if (op.IsBindless)
      {
          // For bindless access, the first source is a copy of Rc.
          sourcesList.Add(context.Copy(Register(op.Rc)));
      }

      int coordsCount = type.GetDimensions();

      for (int index = 0; index < coordsCount; index++)
      {
          sourcesList.Add(Ra());
      }

      if (isArray)
      {
          sourcesList.Add(arrayIndex);

          type |= SamplerType.Array;
      }

      Operand[] sources = sourcesList.ToArray();

      int handle = !op.IsBindless ? op.Immediate : 0;

      TextureFlags flags = op.IsBindless ? TextureFlags.Bindless : TextureFlags.None;

      if (op.UseComponents)
      {
          int componentMask = (int)op.Components;

          // One load per set bit of the component mask; destination registers are consecutive.
          for (int compMask = componentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
          {
              if ((compMask & 1) == 0)
              {
                  continue;
              }

              // Stop as soon as the destination would be RZ.
              if (rdIndex == RegisterConsts.RegisterZeroIndex)
              {
                  break;
              }

              Operand rd = Register(rdIndex++, RegisterType.Gpr);

              TextureOperation operation = new TextureOperation(
                  Instruction.ImageLoad,
                  type,
                  flags,
                  handle,
                  compIndex,
                  rd,
                  sources);

              if (!op.IsBindless)
              {
                  operation.Format = GetTextureFormat(context, handle);
              }

              context.Add(operation);
          }
      }
      else
      {
          if (op.ByteAddress)
          {
              // The X coordinate follows the bindless handle when one is present.
              int xIndex = op.IsBindless ? 1 : 0;

              // Shift the X coordinate right by log2 of the component size in bytes.
              sources[xIndex] = context.ShiftRightS32(sources[xIndex], Const(GetComponentSizeInBytesLog2(op.Size)));
          }

          int components = GetComponents(op.Size);

          for (int compIndex = 0; compIndex < components; compIndex++)
          {
              // Stop as soon as the destination would be RZ.
              if (rdIndex == RegisterConsts.RegisterZeroIndex)
              {
                  break;
              }

              Operand rd = Register(rdIndex++, RegisterType.Gpr);

              TextureOperation operation = new TextureOperation(
                  Instruction.ImageLoad,
                  type,
                  flags,
                  handle,
                  compIndex,
                  rd,
                  sources)
              {
                  Format = GetTextureFormat(op.Size)
              };

              context.Add(operation);

              // Sizes smaller than 32 bits are zero or sign extended in place after the load.
              switch (op.Size)
              {
                  case IntegerSize.U8: context.Copy(rd, ZeroExtendTo32(context, rd, 8)); break;
                  case IntegerSize.U16: context.Copy(rd, ZeroExtendTo32(context, rd, 16)); break;
                  case IntegerSize.S8: context.Copy(rd, SignExtendTo32(context, rd, 8)); break;
                  case IntegerSize.S16: context.Copy(rd, SignExtendTo32(context, rd, 16)); break;
              }
          }
      }
  }
  /// <summary>
  /// Emits the IR for an image store: a single <see cref="Instruction.ImageStore"/> texture operation
  /// whose sources are the (optional) bindless handle, the coordinates and the values to store.
  /// </summary>
  /// <param name="context">Emitter context that provides the current opcode and receives the generated operation</param>
  public static void Sust(EmitterContext context)
  {
      OpCodeImage op = (OpCodeImage)context.CurrOp;

      SamplerType type = ConvertSamplerType(op.Dimensions);

      if (type == SamplerType.None)
      {
          context.Config.GpuAccessor.Log("Invalid image store sampler type.");

          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Sequential register readers: each call copies the next register and advances,
      // or yields a constant zero once the index is above RegisterZeroIndex.
      Operand Ra()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      Operand Rb()
      {
          return nextRb > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRb++, RegisterType.Gpr));
      }

      bool isArray = op.Dimensions == ImageDimensions.Image2DArray ||
                     op.Dimensions == ImageDimensions.Image1DArray;

      // The array index is read first, but appended after the coordinates.
      Operand arrayIndex = null;

      if (isArray)
      {
          arrayIndex = Ra();
      }

      List<Operand> operands = new List<Operand>();

      if (op.IsBindless)
      {
          operands.Add(context.Copy(Register(op.Rc)));
      }

      for (int remaining = type.GetDimensions(); remaining > 0; remaining--)
      {
          operands.Add(Ra());
      }

      if (isArray)
      {
          operands.Add(arrayIndex);

          type |= SamplerType.Array;
      }

      TextureFormat format;

      if (!op.UseComponents)
      {
          if (op.ByteAddress)
          {
              // The X coordinate follows the bindless handle when one is present.
              int xIndex = op.IsBindless ? 1 : 0;

              operands[xIndex] = context.ShiftRightS32(operands[xIndex], Const(GetComponentSizeInBytesLog2(op.Size)));
          }

          for (int remaining = GetComponents(op.Size); remaining > 0; remaining--)
          {
              operands.Add(Rb());
          }

          format = GetTextureFormat(op.Size);
      }
      else
      {
          // One value register is read for every set bit of the component mask.
          for (int bits = (int)op.Components; bits != 0; bits >>= 1)
          {
              if ((bits & 1) != 0)
              {
                  operands.Add(Rb());
              }
          }

          format = op.IsBindless
              ? TextureFormat.Unknown
              : GetTextureFormat(context, op.Immediate);
      }

      int handle = op.IsBindless ? 0 : op.Immediate;

      TextureFlags flags = op.IsBindless ? TextureFlags.Bindless : TextureFlags.None;

      context.Add(new TextureOperation(
          Instruction.ImageStore,
          type,
          flags,
          handle,
          0,
          null,
          operands.ToArray())
      {
          Format = format
      });
  }
  /// <summary>
  /// Emits a texture sample with no additional texture flags.
  /// </summary>
  /// <param name="context">Emitter context forwarded to <see cref="EmitTextureSample"/></param>
  public static void Tex(EmitterContext context) => EmitTextureSample(context, TextureFlags.None);
  /// <summary>
  /// Emits a texture sample with the bindless flag set.
  /// </summary>
  /// <param name="context">Emitter context forwarded to <see cref="EmitTextureSample"/></param>
  public static void TexB(EmitterContext context) => EmitTextureSample(context, TextureFlags.Bindless);
  /// <summary>
  /// Emits a texture sample with the integer coordinates flag set.
  /// </summary>
  /// <param name="context">Emitter context forwarded to <see cref="EmitTextureSample"/></param>
  public static void Tld(EmitterContext context) => EmitTextureSample(context, TextureFlags.IntCoords);
  /// <summary>
  /// Emits a texture sample with both the integer coordinates and bindless flags set.
  /// </summary>
  /// <param name="context">Emitter context forwarded to <see cref="EmitTextureSample"/></param>
  public static void TldB(EmitterContext context)
  {
      const TextureFlags TexelFetchBindless = TextureFlags.IntCoords | TextureFlags.Bindless;

      EmitTextureSample(context, TexelFetchBindless);
  }
  /// <summary>
  /// Emits the IR for the scalar texture opcodes. The current opcode must be an
  /// <c>OpCodeTexs</c>, <c>OpCodeTlds</c> or <c>OpCodeTld4s</c>; the sources are gathered from
  /// the Ra and Rb register sequences in the order required by each target, then one
  /// <see cref="Instruction.TextureSample"/> operation is added per enabled component.
  /// </summary>
  /// <param name="context">Emitter context that provides the current opcode and receives the generated operations</param>
  /// <exception cref="InvalidOperationException">The current opcode is none of the three supported opcode types</exception>
  public static void Texs(EmitterContext context)
  {
      OpCodeTextureScalar op = (OpCodeTextureScalar)context.CurrOp;

      // Nothing is emitted when both destinations are RZ.
      if (op.Rd0.IsRZ && op.Rd1.IsRZ)
      {
          return;
      }

      List<Operand> operands = new List<Operand>();

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Sequential register readers: each call copies the next register and advances,
      // or yields a constant zero once the index is above RegisterZeroIndex.
      Operand Ra()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      Operand Rb()
      {
          return nextRb > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRb++, RegisterType.Gpr));
      }

      // Appends the operands in argument order. Arguments are evaluated left to right,
      // so the register reads happen in the same order as they are written at the call site.
      void Push(params Operand[] values)
      {
          operands.AddRange(values);
      }

      // Reads one packed register from Rb and appends one signed bitfield per coordinate.
      void AddTextureOffset(int coordsCount, int stride, int size)
      {
          Operand packedOffs = Rb();

          for (int index = 0; index < coordsCount; index++)
          {
              operands.Add(context.BitfieldExtractS32(packedOffs, Const(index * stride), Const(size)));
          }
      }

      SamplerType type;
      TextureFlags flags;

      if (op is OpCodeTexs texsOp)
      {
          type = ConvertSamplerType(texsOp.Target);

          if (type == SamplerType.None)
          {
              context.Config.GpuAccessor.Log("Invalid texture sampler type.");

              return;
          }

          flags = ConvertTextureFlags(texsOp.Target);

          if ((type & SamplerType.Array) == 0)
          {
              switch (texsOp.Target)
              {
                  case TextureTarget.Texture1DLodZero:
                      Push(Ra(), ConstF(0));
                      break;

                  case TextureTarget.Texture2D:
                      Push(Ra(), Rb());
                      break;

                  case TextureTarget.Texture2DLodZero:
                      Push(Ra(), Rb(), ConstF(0));
                      break;

                  case TextureTarget.Texture2DLodLevel:
                  case TextureTarget.Texture2DDepthCompare:
                  case TextureTarget.Texture3D:
                  case TextureTarget.TextureCube:
                      Push(Ra(), Ra(), Rb());
                      break;

                  case TextureTarget.Texture2DLodZeroDepthCompare:
                  case TextureTarget.Texture3DLodZero:
                      Push(Ra(), Ra(), Rb(), ConstF(0));
                      break;

                  case TextureTarget.Texture2DLodLevelDepthCompare:
                  case TextureTarget.TextureCubeLodLevel:
                      Push(Ra(), Ra(), Rb(), Rb());
                      break;
              }
          }
          else
          {
              // The array index is read first, but placed after the two coordinates.
              Operand arrayIndex = Ra();

              Push(Ra(), Rb(), arrayIndex);

              if ((type & SamplerType.Shadow) != 0)
              {
                  operands.Add(Rb());
              }

              if ((flags & TextureFlags.LodLevel) != 0)
              {
                  operands.Add(ConstF(0));
              }
          }
      }
      else if (op is OpCodeTlds tldsOp)
      {
          type = ConvertSamplerType(tldsOp.Target);

          if (type == SamplerType.None)
          {
              context.Config.GpuAccessor.Log("Invalid texel fetch sampler type.");

              return;
          }

          flags = ConvertTextureFlags(tldsOp.Target) | TextureFlags.IntCoords;

          // A 1D fetch with LOD zero is turned into a texture buffer fetch when the GPU accessor says so.
          if (tldsOp.Target == TexelLoadTarget.Texture1DLodZero && context.Config.GpuAccessor.QueryIsTextureBuffer(tldsOp.Immediate))
          {
              type = SamplerType.TextureBuffer;
              flags &= ~TextureFlags.LodLevel;
          }

          switch (tldsOp.Target)
          {
              case TexelLoadTarget.Texture1DLodZero:
                  operands.Add(Ra());

                  if (type != SamplerType.TextureBuffer)
                  {
                      operands.Add(Const(0));
                  }
                  break;

              case TexelLoadTarget.Texture1DLodLevel:
                  Push(Ra(), Rb());
                  break;

              case TexelLoadTarget.Texture2DLodZero:
                  Push(Ra(), Rb(), Const(0));
                  break;

              case TexelLoadTarget.Texture2DLodZeroOffset:
                  Push(Ra(), Ra(), Const(0));
                  break;

              case TexelLoadTarget.Texture2DLodZeroMultisample:
              case TexelLoadTarget.Texture2DLodLevel:
              case TexelLoadTarget.Texture2DLodLevelOffset:
                  Push(Ra(), Ra(), Rb());
                  break;

              case TexelLoadTarget.Texture3DLodZero:
                  Push(Ra(), Ra(), Rb(), Const(0));
                  break;

              case TexelLoadTarget.Texture2DArrayLodZero:
                  Push(Rb(), Rb(), Ra(), Const(0));
                  break;
          }

          if ((flags & TextureFlags.Offset) != 0)
          {
              AddTextureOffset(type.GetDimensions(), 4, 4);
          }
      }
      else if (op is OpCodeTld4s tld4sOp)
      {
          // With depth compare or offset, both coordinates come from Ra; otherwise the second comes from Rb.
          bool secondCoordFromRa = tld4sOp.HasDepthCompare || tld4sOp.HasOffset;

          Push(Ra(), secondCoordFromRa ? Ra() : Rb());

          type = SamplerType.Texture2D;
          flags = TextureFlags.Gather;

          if (tld4sOp.HasDepthCompare)
          {
              operands.Add(Rb());

              type |= SamplerType.Shadow;
          }

          if (tld4sOp.HasOffset)
          {
              AddTextureOffset(type.GetDimensions(), 8, 6);

              flags |= TextureFlags.Offset;
          }

          operands.Add(Const(tld4sOp.GatherCompIndex));
      }
      else
      {
          throw new InvalidOperationException($"Invalid opcode type \"{op.GetType().Name}\".");
      }

      Operand[] sources = operands.ToArray();

      // Halves collected for the FP16 path; slots never written stay as constant zero.
      Operand[] rd0 = { ConstF(0), ConstF(0) };
      Operand[] rd1 = { ConstF(0), ConstF(0) };

      int destCount = 0;

      // Returns the destination for the next enabled component. For FP16 a new local is
      // recorded in rd0/rd1 for later packing; otherwise the Rd0/Rd1 register (plus one
      // for the second value of the pair, unless the base is RZ) is returned.
      Operand GetDest()
      {
          bool useRd1 = (destCount >> 1) != 0;
          int low = destCount & 1;

          destCount++;

          if (op.IsFp16)
          {
              Operand half = Local();

              if (useRd1)
              {
                  rd1[low] = half;
              }
              else
              {
                  rd0[low] = half;
              }

              return half;
          }

          int rdIndex = useRd1 ? op.Rd1.Index : op.Rd0.Index;

          if (rdIndex < RegisterConsts.RegisterZeroIndex)
          {
              rdIndex += low;
          }

          return Register(rdIndex, RegisterType.Gpr);
      }

      int handle = op.Immediate;

      for (int compMask = op.ComponentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
      {
          if ((compMask & 1) == 0)
          {
              continue;
          }

          context.Add(new TextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              compIndex,
              GetDest(),
              sources));
      }

      if (op.IsFp16)
      {
          // Pack each pair of halves into its destination register.
          context.Copy(Register(op.Rd0), context.PackHalf2x16(rd0[0], rd0[1]));
          context.Copy(Register(op.Rd1), context.PackHalf2x16(rd1[0], rd1[1]));
      }
  }
  /// <summary>
  /// Emits the IR for a texture gather: the sources are built from the Ra and Rb register
  /// sequences, then one <see cref="Instruction.TextureSample"/> operation with the
  /// <see cref="TextureFlags.Gather"/> flag is added per enabled component.
  /// </summary>
  /// <param name="context">Emitter context that provides the current opcode and receives the generated operations</param>
  public static void Tld4(EmitterContext context)
  {
      IOpCodeTld4 op = (IOpCodeTld4)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Sequential register readers: each call copies the next register and advances,
      // or yields a constant zero once the index is above RegisterZeroIndex.
      Operand Ra()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      Operand Rb()
      {
          return nextRb > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRb++, RegisterType.Gpr));
      }

      // The array index is read first, but appended after the coordinates.
      Operand arrayIndex = null;

      if (op.IsArray)
      {
          arrayIndex = Ra();
      }

      List<Operand> operands = new List<Operand>();

      SamplerType type = ConvertSamplerType(op.Dimensions);

      TextureFlags flags = TextureFlags.Gather;

      if (op.Bindless)
      {
          operands.Add(Rb());

          flags |= TextureFlags.Bindless;
      }

      int coordsCount = type.GetDimensions();

      for (int remaining = coordsCount; remaining > 0; remaining--)
      {
          operands.Add(Ra());
      }

      if (op.IsArray)
      {
          operands.Add(arrayIndex);

          type |= SamplerType.Array;
      }

      bool hasOffset = op.Offset != TextureGatherOffset.None;
      bool hasOffsets = op.Offset == TextureGatherOffset.Offsets;

      // Packed offsets are read from Rb before the depth compare value.
      Operand packedLow = hasOffset ? Rb() : null;
      Operand packedHigh = hasOffsets ? Rb() : null;

      if (op.HasDepthCompare)
      {
          operands.Add(Rb());

          type |= SamplerType.Shadow;
      }

      if (hasOffset)
      {
          int offsetValuesCount = coordsCount * (hasOffsets ? 4 : 1);

          for (int index = 0; index < offsetValuesCount; index++)
          {
              // Each packed register holds four values; bit 2 of the index selects the register.
              Operand packed = ((index >> 2) & 1) != 0 ? packedHigh : packedLow;

              operands.Add(context.BitfieldExtractS32(packed, Const((index & 3) * 8), Const(6)));
          }

          flags |= hasOffsets ? TextureFlags.Offsets : TextureFlags.Offset;
      }

      operands.Add(Const(op.GatherCompIndex));

      Operand[] sources = operands.ToArray();

      int rdIndex = op.Rd.Index;

      // Returns the next destination register, or a constant zero once the index is above RegisterZeroIndex.
      Operand GetDest()
      {
          return rdIndex > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : Register(rdIndex++, RegisterType.Gpr);
      }

      int handle = op.Immediate;

      for (int compMask = op.ComponentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
      {
          if ((compMask & 1) == 0)
          {
              continue;
          }

          context.Add(new TextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              compIndex,
              GetDest(),
              sources));
      }
  }
  /// <summary>
  /// Emits the mip map level query in its bindless form.
  /// </summary>
  /// <param name="context">Emitter context forwarded to <see cref="EmitTextureMipMapLevel"/></param>
  public static void TmmlB(EmitterContext context) => EmitTextureMipMapLevel(context, isBindless: true);
  /// <summary>
  /// Emits the mip map level query in its non-bindless form.
  /// </summary>
  /// <param name="context">Emitter context forwarded to <see cref="EmitTextureMipMapLevel"/></param>
  public static void Tmml(EmitterContext context) => EmitTextureMipMapLevel(context, isBindless: false);
  /// <summary>
  /// Emits one <see cref="Instruction.Lod"/> operation per enabled x/y component. Each result is
  /// multiplied by 256 and converted to a signed integer before being written to the destination.
  /// Enabled z/w components are written as zero.
  /// </summary>
  /// <param name="context">Emitter context that provides the current opcode and receives the generated operations</param>
  /// <param name="isBindless">True to read the texture handle from Rb instead of using the opcode immediate</param>
  private static void EmitTextureMipMapLevel(EmitterContext context, bool isBindless)
  {
      OpCodeTexture op = (OpCodeTexture)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Sequential register readers: each call copies the next register and advances,
      // or yields a constant zero once the index is above RegisterZeroIndex.
      Operand Ra()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      Operand Rb()
      {
          return nextRb > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRb++, RegisterType.Gpr));
      }

      TextureFlags flags = TextureFlags.None;

      List<Operand> operands = new List<Operand>();

      if (isBindless)
      {
          operands.Add(Rb());

          flags |= TextureFlags.Bindless;
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      int coordsCount = type.GetDimensions();

      // The array index is read first, but appended after the coordinates.
      Operand arrayIndex = null;

      if (op.IsArray)
      {
          arrayIndex = Ra();
      }

      for (int remaining = coordsCount; remaining > 0; remaining--)
      {
          operands.Add(Ra());
      }

      if (op.IsArray)
      {
          operands.Add(arrayIndex);

          type |= SamplerType.Array;
      }

      Operand[] sources = operands.ToArray();

      int rdIndex = op.Rd.Index;

      // Returns the next destination register, or a constant zero once the index is above RegisterZeroIndex.
      Operand GetDest()
      {
          return rdIndex > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : Register(rdIndex++, RegisterType.Gpr);
      }

      int handle = isBindless ? 0 : op.Immediate;

      for (int compMask = op.ComponentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
      {
          if ((compMask & 1) == 0)
          {
              continue;
          }

          Operand dest = GetDest();

          if (compIndex < 2)
          {
              Operand rawLod = Local();

              context.Add(new TextureOperation(
                  Instruction.Lod,
                  type,
                  flags,
                  handle,
                  compIndex,
                  rawLod,
                  sources));

              Operand scaledLod = context.FPMultiply(rawLod, ConstF(256.0f));

              context.Copy(dest, context.FPConvertToS32(scaledLod));
          }
          else
          {
              // Components z and w aren't standard, we return 0 in this case and add a comment.
              context.Add(new CommentNode("Unsupported component z or w found"));
              context.Copy(dest, Const(0));
          }
      }
  }
  /// <summary>
  /// Emits the IR for a texture sample with explicit derivatives: the sources are the optional
  /// bindless handle, the coordinates, the optional array index, the X and Y derivatives and the
  /// optional offsets. One <see cref="Instruction.TextureSample"/> operation is added per enabled component.
  /// </summary>
  /// <param name="context">Emitter context that provides the current opcode and receives the generated operations</param>
  public static void Txd(EmitterContext context)
  {
      OpCodeTxd op = (OpCodeTxd)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Sequential register readers: each call copies the next register and advances,
      // or yields a constant zero once the index is above RegisterZeroIndex.
      Operand Ra()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      Operand Rb()
      {
          return nextRb > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRb++, RegisterType.Gpr));
      }

      TextureFlags flags = TextureFlags.Derivatives;

      List<Operand> operands = new List<Operand>();

      if (op.IsBindless)
      {
          // Here the bindless handle comes from the Ra sequence.
          operands.Add(Ra());

          flags |= TextureFlags.Bindless;
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      int coordsCount = type.GetDimensions();

      for (int remaining = coordsCount; remaining > 0; remaining--)
      {
          operands.Add(Ra());
      }

      // The register after the coordinates packs the array index (low 16 bits) and the offsets.
      Operand packedParams = Ra();

      if (op.IsArray)
      {
          operands.Add(context.BitwiseAnd(packedParams, Const(0xffff)));

          type |= SamplerType.Array;
      }

      // Derivatives (X and Y).
      for (int remaining = 2 * coordsCount; remaining > 0; remaining--)
      {
          operands.Add(Rb());
      }

      if (op.HasOffset)
      {
          // Offsets are 4-bit signed fields starting at bit 16 of the packed register.
          for (int index = 0; index < coordsCount; index++)
          {
              operands.Add(context.BitfieldExtractS32(packedParams, Const(16 + index * 4), Const(4)));
          }

          flags |= TextureFlags.Offset;
      }

      Operand[] sources = operands.ToArray();

      int rdIndex = op.Rd.Index;

      // Returns the next destination register, or a constant zero once the index is above RegisterZeroIndex.
      Operand GetDest()
      {
          return rdIndex > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : Register(rdIndex++, RegisterType.Gpr);
      }

      int handle = op.IsBindless ? 0 : op.Immediate;

      for (int compMask = op.ComponentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
      {
          if ((compMask & 1) == 0)
          {
              continue;
          }

          context.Add(new TextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              compIndex,
              GetDest(),
              sources));
      }
  }
  /// <summary>
  /// Emits the texture query in its non-bindless form.
  /// </summary>
  /// <param name="context">Emitter context forwarded to <see cref="EmitTextureQuery"/></param>
  public static void Txq(EmitterContext context) => EmitTextureQuery(context, bindless: false);
  /// <summary>
  /// Emits the texture query in its bindless form.
  /// </summary>
  /// <param name="context">Emitter context forwarded to <see cref="EmitTextureQuery"/></param>
  public static void TxqB(EmitterContext context) => EmitTextureQuery(context, bindless: true);
  /// <summary>
  /// Emits one <see cref="Instruction.TextureSize"/> operation per enabled component. The queried
  /// property is decoded from the opcode but not used yet, and the sampler type is always
  /// <see cref="SamplerType.Texture2D"/>.
  /// </summary>
  /// <param name="context">Emitter context that provides the current opcode and receives the generated operations</param>
  /// <param name="bindless">True to read the texture handle from Ra instead of using the opcode immediate</param>
  private static void EmitTextureQuery(EmitterContext context, bool bindless)
  {
      OpCodeTex op = (OpCodeTex)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      TextureProperty property = (TextureProperty)op.RawOpCode.Extract(22, 6);

      // TODO: Validate and use property.
      Instruction inst = Instruction.TextureSize;

      SamplerType type = SamplerType.Texture2D;

      TextureFlags flags = TextureFlags.None;

      if (bindless)
      {
          flags = TextureFlags.Bindless;
      }

      int nextRa = op.Ra.Index;

      // Copies the next Ra register and advances, or yields a constant zero
      // once the index is above RegisterZeroIndex.
      Operand Ra()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      List<Operand> operands = new List<Operand>();

      if (bindless)
      {
          operands.Add(Ra());
      }

      operands.Add(Ra());

      Operand[] sources = operands.ToArray();

      int rdIndex = op.Rd.Index;

      // Returns the next destination register, or a constant zero once the index is above RegisterZeroIndex.
      Operand GetDest()
      {
          return rdIndex > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : Register(rdIndex++, RegisterType.Gpr);
      }

      int handle = bindless ? 0 : op.Immediate;

      for (int compMask = op.ComponentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
      {
          if ((compMask & 1) == 0)
          {
              continue;
          }

          context.Add(new TextureOperation(
              inst,
              type,
              flags,
              handle,
              compIndex,
              GetDest(),
              sources));
      }
  }
  /// <summary>
  /// Shared emitter for the texture sample and texel fetch entry points. Builds the source list
  /// from the Ra and Rb register sequences according to the opcode modifiers, then adds one
  /// <see cref="Instruction.TextureSample"/> operation per enabled component.
  /// </summary>
  /// <param name="context">Emitter context that provides the current opcode and receives the generated operations</param>
  /// <param name="flags">Initial texture flags; further flags are added depending on the opcode modifiers</param>
  private static void EmitTextureSample(EmitterContext context, TextureFlags flags)
  {
      OpCodeTexture op = (OpCodeTexture)context.CurrOp;

      bool isBindless = (flags & TextureFlags.Bindless) != 0;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Sequential register readers: each call copies the next register and advances,
      // or yields a constant zero once the index is above RegisterZeroIndex.
      Operand Ra()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      Operand Rb()
      {
          return nextRb > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRb++, RegisterType.Gpr));
      }

      // The array index is read first, but appended after the coordinates.
      Operand arrayIndex = null;

      if (op.IsArray)
      {
          arrayIndex = Ra();
      }

      List<Operand> operands = new List<Operand>();

      if (isBindless)
      {
          operands.Add(Rb());
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      bool hasLod = op.LodMode > TextureLodMode.LodZero;

      // A 1D integer-coordinate fetch without any other modifier may be a texture buffer fetch.
      bool isPlainTexelFetch1D =
          type == SamplerType.Texture1D &&
          (flags & ~TextureFlags.Bindless) == TextureFlags.IntCoords &&
          !hasLod &&
          !op.HasDepthCompare &&
          !op.HasOffset &&
          !op.IsArray &&
          !op.IsMultisample;

      // For bindless, we don't have any way to know the texture type,
      // so we assume it's texture buffer when the sampler type is 1D, since that's more common.
      if (isPlainTexelFetch1D && (isBindless || context.Config.GpuAccessor.QueryIsTextureBuffer(op.Immediate)))
      {
          type = SamplerType.TextureBuffer;
      }

      int coordsCount = type.GetDimensions();

      for (int remaining = coordsCount; remaining > 0; remaining--)
      {
          operands.Add(Ra());
      }

      if (op.IsArray)
      {
          operands.Add(arrayIndex);

          type |= SamplerType.Array;
      }

      // Rb is consumed in this order: LOD value, packed offsets, depth compare value, sample index.
      Operand lodValue = hasLod ? Rb() : ConstF(0);

      Operand packedOffs = op.HasOffset ? Rb() : null;

      if (op.HasDepthCompare)
      {
          operands.Add(Rb());

          type |= SamplerType.Shadow;
      }

      bool usesLodLevel = op.LodMode == TextureLodMode.LodZero ||
                          op.LodMode == TextureLodMode.LodLevel ||
                          op.LodMode == TextureLodMode.LodLevelA;

      if (usesLodLevel && !op.IsMultisample && type != SamplerType.TextureBuffer)
      {
          operands.Add(lodValue);

          flags |= TextureFlags.LodLevel;
      }

      if (op.HasOffset)
      {
          // One 4-bit signed offset per coordinate.
          for (int index = 0; index < coordsCount; index++)
          {
              operands.Add(context.BitfieldExtractS32(packedOffs, Const(index * 4), Const(4)));
          }

          flags |= TextureFlags.Offset;
      }

      bool usesLodBias = op.LodMode == TextureLodMode.LodBias ||
                         op.LodMode == TextureLodMode.LodBiasA;

      if (usesLodBias)
      {
          operands.Add(lodValue);

          flags |= TextureFlags.LodBias;
      }

      if (op.IsMultisample)
      {
          operands.Add(Rb());

          type |= SamplerType.Multisample;
      }

      Operand[] sources = operands.ToArray();

      int rdIndex = op.Rd.Index;

      // Returns the next destination register, or a constant zero once the index is above RegisterZeroIndex.
      Operand GetDest()
      {
          return rdIndex > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : Register(rdIndex++, RegisterType.Gpr);
      }

      int handle = isBindless ? 0 : op.Immediate;

      for (int compMask = op.ComponentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
      {
          if ((compMask & 1) == 0)
          {
              continue;
          }

          context.Add(new TextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              compIndex,
              GetDest(),
              sources));
      }
  }
  /// <summary>
  /// Gets the component count associated with an integer access size.
  /// </summary>
  /// <param name="size">Integer size to query</param>
  /// <returns>2 for B64, 4 for B128 and UB128, and 1 for every other size</returns>
  private static int GetComponents(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.B64:
              return 2;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return 4;

          default:
              // Every remaining size is treated as a single component.
              return 1;
      }
  }
  /// <summary>
  /// Gets a base-2 logarithm of a byte size for the given integer access size.
  /// </summary>
  /// <remarks>
  /// NOTE(review): for B64, B128 and UB128 the returned value (3 and 4) looks like the log2 of the
  /// whole access width in bytes rather than of a single component - confirm against the callers.
  /// </remarks>
  /// <param name="size">Integer size to query</param>
  /// <returns>
  /// 0 for U8 and S8, 1 for U16 and S16, 2 for B32, 3 for B64, 4 for B128 and UB128,
  /// and 2 for any other value
  /// </returns>
  private static int GetComponentSizeInBytesLog2(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.U8:
          case IntegerSize.S8:
              return 0;

          case IntegerSize.U16:
          case IntegerSize.S16:
              return 1;

          case IntegerSize.B64:
              return 3;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return 4;

          case IntegerSize.B32:
          default:
              // B32 shares its result with the fallback used for unlisted sizes.
              return 2;
      }
  }
  /// <summary>
  /// Selects the texture format to declare for the texture with the given handle.
  /// </summary>
  /// <param name="context">Emitter context, used to reach the GPU accessor</param>
  /// <param name="handle">Texture handle passed to the format query and to the log message</param>
  /// <returns>
  /// <see cref="TextureFormat.Unknown"/> when formatted image loads are supported; otherwise the
  /// queried format, or <see cref="TextureFormat.R8G8B8A8Unorm"/> when the query yields Unknown
  /// </returns>
  private static TextureFormat GetTextureFormat(EmitterContext context, int handle)
  {
      var gpuAccessor = context.Config.GpuAccessor;

      if (!gpuAccessor.QuerySupportsImageLoadFormatted())
      {
          var queriedFormat = gpuAccessor.QueryTextureFormat(handle);

          if (queriedFormat != TextureFormat.Unknown)
          {
              return queriedFormat;
          }

          // The format could not be determined: report it and fall back to RGBA8 unorm.
          gpuAccessor.Log($"Unknown format for texture {handle}.");

          return TextureFormat.R8G8B8A8Unorm;
      }

      // With the formatted load extension no format has to be specified;
      // the image is declared without one and the GPU will handle it.
      return TextureFormat.Unknown;
  }
  /// <summary>
  /// Maps an integer access size to an unsigned/signed integer texture format.
  /// </summary>
  /// <param name="size">Integer size to map</param>
  /// <returns>
  /// The format paired with <paramref name="size"/>; <see cref="TextureFormat.R32Uint"/> for B32
  /// and for any value that is not listed
  /// </returns>
  private static TextureFormat GetTextureFormat(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.U8:
              return TextureFormat.R8Uint;

          case IntegerSize.S8:
              return TextureFormat.R8Sint;

          case IntegerSize.U16:
              return TextureFormat.R16Uint;

          case IntegerSize.S16:
              return TextureFormat.R16Sint;

          case IntegerSize.B64:
              return TextureFormat.R32G32Uint;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return TextureFormat.R32G32B32A32Uint;

          case IntegerSize.B32:
          default:
              // B32 and the fallback for unlisted sizes produce the same format.
              return TextureFormat.R32Uint;
      }
  }
  /// <summary>
  /// Converts image dimensions into the equivalent sampler type.
  /// </summary>
  /// <param name="target">Image dimensions to convert</param>
  /// <returns>
  /// The matching sampler type (with the Array flag for array images), or
  /// <see cref="SamplerType.None"/> when <paramref name="target"/> is not one of the handled values
  /// </returns>
  private static SamplerType ConvertSamplerType(ImageDimensions target)
  {
      switch (target)
      {
          case ImageDimensions.Image1D:
              return SamplerType.Texture1D;

          case ImageDimensions.ImageBuffer:
              return SamplerType.TextureBuffer;

          case ImageDimensions.Image1DArray:
              return SamplerType.Texture1D | SamplerType.Array;

          case ImageDimensions.Image2D:
              return SamplerType.Texture2D;

          case ImageDimensions.Image2DArray:
              return SamplerType.Texture2D | SamplerType.Array;

          case ImageDimensions.Image3D:
              return SamplerType.Texture3D;

          default:
              return SamplerType.None;
      }
  }
  /// <summary>
  /// Converts texture dimensions into the equivalent sampler type.
  /// </summary>
  /// <param name="dimensions">Texture dimensions to convert</param>
  /// <returns>The 1D, 2D, 3D or cube sampler type matching <paramref name="dimensions"/></returns>
  /// <exception cref="ArgumentException">
  /// Thrown when <paramref name="dimensions"/> is not one of the four handled values
  /// </exception>
  private static SamplerType ConvertSamplerType(TextureDimensions dimensions)
  {
      switch (dimensions)
      {
          case TextureDimensions.Texture1D:
              return SamplerType.Texture1D;

          case TextureDimensions.Texture2D:
              return SamplerType.Texture2D;

          case TextureDimensions.Texture3D:
              return SamplerType.Texture3D;

          case TextureDimensions.TextureCube:
              return SamplerType.TextureCube;

          default:
              throw new ArgumentException($"Invalid texture dimensions \"{dimensions}\".");
      }
  }
  /// <summary>
  /// Converts a texture target into the equivalent sampler type.
  /// </summary>
  /// <param name="type">Texture target to convert</param>
  /// <returns>
  /// The sampler type for the target, including the Array and Shadow flags where the target
  /// name carries them, or <see cref="SamplerType.None"/> for any target that is not listed
  /// </returns>
  private static SamplerType ConvertSamplerType(TextureTarget type) => type switch
  {
      // 1D.
      TextureTarget.Texture1DLodZero => SamplerType.Texture1D,

      // Plain 2D.
      TextureTarget.Texture2D => SamplerType.Texture2D,
      TextureTarget.Texture2DLodZero => SamplerType.Texture2D,
      TextureTarget.Texture2DLodLevel => SamplerType.Texture2D,

      // 2D with depth comparison.
      TextureTarget.Texture2DDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,
      TextureTarget.Texture2DLodLevelDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,
      TextureTarget.Texture2DLodZeroDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,

      // 2D arrays, without and with depth comparison.
      TextureTarget.Texture2DArray => SamplerType.Texture2D | SamplerType.Array,
      TextureTarget.Texture2DArrayLodZero => SamplerType.Texture2D | SamplerType.Array,
      TextureTarget.Texture2DArrayLodZeroDepthCompare => SamplerType.Texture2D | SamplerType.Array | SamplerType.Shadow,

      // 3D.
      TextureTarget.Texture3D => SamplerType.Texture3D,
      TextureTarget.Texture3DLodZero => SamplerType.Texture3D,

      // Cube.
      TextureTarget.TextureCube => SamplerType.TextureCube,
      TextureTarget.TextureCubeLodLevel => SamplerType.TextureCube,

      _ => SamplerType.None
  };
  /// <summary>
  /// Converts a texel load target into the equivalent sampler type.
  /// </summary>
  /// <param name="type">Texel load target to convert</param>
  /// <returns>
  /// The sampler type for the target, including the Multisample or Array flag where the target
  /// name carries it, or <see cref="SamplerType.None"/> for any target that is not listed
  /// </returns>
  private static SamplerType ConvertSamplerType(TexelLoadTarget type) => type switch
  {
      // 1D.
      TexelLoadTarget.Texture1DLodZero => SamplerType.Texture1D,
      TexelLoadTarget.Texture1DLodLevel => SamplerType.Texture1D,

      // Plain 2D, with or without offset.
      TexelLoadTarget.Texture2DLodZero => SamplerType.Texture2D,
      TexelLoadTarget.Texture2DLodZeroOffset => SamplerType.Texture2D,
      TexelLoadTarget.Texture2DLodLevel => SamplerType.Texture2D,
      TexelLoadTarget.Texture2DLodLevelOffset => SamplerType.Texture2D,

      // 2D variants carrying an extra flag.
      TexelLoadTarget.Texture2DLodZeroMultisample => SamplerType.Texture2D | SamplerType.Multisample,
      TexelLoadTarget.Texture2DArrayLodZero => SamplerType.Texture2D | SamplerType.Array,

      // 3D.
      TexelLoadTarget.Texture3DLodZero => SamplerType.Texture3D,

      _ => SamplerType.None
  };
  /// <summary>
  /// Gets the texture flags implied by a texture target.
  /// </summary>
  /// <param name="type">Texture target to inspect</param>
  /// <returns>
  /// <see cref="TextureFlags.LodLevel"/> for the LodZero and LodLevel targets listed below;
  /// <see cref="TextureFlags.None"/> for every other target
  /// </returns>
  private static TextureFlags ConvertTextureFlags(TextureTarget type) => type switch
  {
      TextureTarget.Texture1DLodZero => TextureFlags.LodLevel,
      TextureTarget.Texture2DLodZero => TextureFlags.LodLevel,
      TextureTarget.Texture2DLodLevel => TextureFlags.LodLevel,
      TextureTarget.Texture2DLodLevelDepthCompare => TextureFlags.LodLevel,
      TextureTarget.Texture2DLodZeroDepthCompare => TextureFlags.LodLevel,
      TextureTarget.Texture2DArrayLodZero => TextureFlags.LodLevel,
      TextureTarget.Texture2DArrayLodZeroDepthCompare => TextureFlags.LodLevel,
      TextureTarget.Texture3DLodZero => TextureFlags.LodLevel,
      TextureTarget.TextureCubeLodLevel => TextureFlags.LodLevel,

      // Texture2D, Texture2DDepthCompare, Texture2DArray, Texture3D and TextureCube
      // carry no flags, which is the same result as for any unlisted target.
      _ => TextureFlags.None
  };
  /// <summary>
  /// Gets the texture flags implied by a texel load target.
  /// </summary>
  /// <param name="type">Texel load target to inspect</param>
  /// <returns>
  /// <see cref="TextureFlags.LodLevel"/> for the listed targets, combined with
  /// <see cref="TextureFlags.Offset"/> for the two Offset targets;
  /// <see cref="TextureFlags.None"/> for any target that is not listed
  /// </returns>
  private static TextureFlags ConvertTextureFlags(TexelLoadTarget type) => type switch
  {
      // Targets without an offset.
      TexelLoadTarget.Texture1DLodZero => TextureFlags.LodLevel,
      TexelLoadTarget.Texture1DLodLevel => TextureFlags.LodLevel,
      TexelLoadTarget.Texture2DLodZero => TextureFlags.LodLevel,
      TexelLoadTarget.Texture2DLodLevel => TextureFlags.LodLevel,
      TexelLoadTarget.Texture2DLodZeroMultisample => TextureFlags.LodLevel,
      TexelLoadTarget.Texture3DLodZero => TextureFlags.LodLevel,
      TexelLoadTarget.Texture2DArrayLodZero => TextureFlags.LodLevel,

      // Targets with an offset.
      TexelLoadTarget.Texture2DLodZeroOffset => TextureFlags.LodLevel | TextureFlags.Offset,
      TexelLoadTarget.Texture2DLodLevelOffset => TextureFlags.LodLevel | TextureFlags.Offset,

      _ => TextureFlags.None
  };
  1091. }
  1092. }