InstEmitTexture.cs 45 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471
  1. using Ryujinx.Graphics.Shader.Decoders;
  2. using Ryujinx.Graphics.Shader.IntermediateRepresentation;
  3. using Ryujinx.Graphics.Shader.Translation;
  4. using System;
  5. using System.Collections.Generic;
  6. using static Ryujinx.Graphics.Shader.Instructions.InstEmitHelper;
  7. using static Ryujinx.Graphics.Shader.IntermediateRepresentation.OperandHelper;
  8. namespace Ryujinx.Graphics.Shader.Instructions
  9. {
  10. static partial class InstEmit
  11. {
  // When true, the emitters in this class turn 1D sampler types into 2D ones,
  // appending a constant 0 as the extra coordinate.
  private const bool Sample1DAs2D = true;
  /// <summary>
  /// Emits the operations for the SULD (image load) instruction.
  /// </summary>
  /// <remarks>
  /// One <see cref="Instruction.ImageLoad"/> operation is generated per destination register.
  /// Emission stops as soon as the destination index reaches the zero register.
  /// </remarks>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  public static void Suld(EmitterContext context)
  {
      context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

      OpCodeImage op = (OpCodeImage)context.CurrOp;

      SamplerType type = ConvertSamplerType(op.Dimensions);

      if (type == SamplerType.None)
      {
          // This is the load path; the message must not claim a store failed.
          context.Config.GpuAccessor.Log("Invalid image load sampler type.");

          return;
      }

      // Rb is Rd on the SULD instruction.
      int rdIndex = op.Rb.Index;
      int raIndex = op.Ra.Index;

      // Reads the next consecutive source register. Once the index has moved
      // past the zero register, a constant 0 is returned instead.
      Operand Ra()
      {
          if (raIndex > RegisterConsts.RegisterZeroIndex)
          {
              return Const(0);
          }

          return context.Copy(Register(raIndex++, RegisterType.Gpr));
      }

      List<Operand> sourcesList = new List<Operand>();

      if (op.IsBindless)
      {
          // Bindless accesses carry an extra leading source read from Rc.
          sourcesList.Add(context.Copy(Register(op.Rc)));
      }

      int coordsCount = type.GetDimensions();

      for (int index = 0; index < coordsCount; index++)
      {
          sourcesList.Add(Ra());
      }

      if (Sample1DAs2D && (type & SamplerType.Mask) == SamplerType.Texture1D)
      {
          // Promote 1D to 2D, using 0 for the added coordinate.
          sourcesList.Add(Const(0));

          type &= ~SamplerType.Mask;
          type |= SamplerType.Texture2D;
      }

      if (type.HasFlag(SamplerType.Array))
      {
          // The array flag is already part of the type here, only the extra source is needed.
          sourcesList.Add(Ra());
      }

      Operand[] sources = sourcesList.ToArray();

      int handle = !op.IsBindless ? op.HandleOffset : 0;

      TextureFlags flags = op.IsBindless ? TextureFlags.Bindless : TextureFlags.None;

      if (op.UseComponents)
      {
          int componentMask = (int)op.Components;

          for (int compMask = componentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
          {
              if ((compMask & 1) == 0)
              {
                  continue;
              }

              if (rdIndex == RegisterConsts.RegisterZeroIndex)
              {
                  break;
              }

              Operand rd = Register(rdIndex++, RegisterType.Gpr);

              TextureOperation operation = context.CreateTextureOperation(
                  Instruction.ImageLoad,
                  type,
                  flags,
                  handle,
                  compIndex,
                  rd,
                  sources);

              if (!op.IsBindless)
              {
                  operation.Format = context.Config.GetTextureFormat(handle);
              }

              context.Add(operation);
          }
      }
      else
      {
          if (op.ByteAddress)
          {
              // The X coordinate sits after the extra bindless source, when there is one.
              int xIndex = op.IsBindless ? 1 : 0;

              sources[xIndex] = context.ShiftRightS32(sources[xIndex], Const(GetComponentSizeInBytesLog2(op.Size)));
          }

          int components = GetComponents(op.Size);

          for (int compIndex = 0; compIndex < components; compIndex++)
          {
              if (rdIndex == RegisterConsts.RegisterZeroIndex)
              {
                  break;
              }

              Operand rd = Register(rdIndex++, RegisterType.Gpr);

              TextureOperation operation = context.CreateTextureOperation(
                  Instruction.ImageLoad,
                  type,
                  GetTextureFormat(op.Size),
                  flags,
                  handle,
                  compIndex,
                  rd,
                  sources);

              context.Add(operation);

              // Sub-word sizes are widened to 32 bits after the load.
              switch (op.Size)
              {
                  case IntegerSize.U8: context.Copy(rd, ZeroExtendTo32(context, rd, 8)); break;
                  case IntegerSize.U16: context.Copy(rd, ZeroExtendTo32(context, rd, 16)); break;
                  case IntegerSize.S8: context.Copy(rd, SignExtendTo32(context, rd, 8)); break;
                  case IntegerSize.S16: context.Copy(rd, SignExtendTo32(context, rd, 16)); break;
              }
          }
      }
  }
  /// <summary>
  /// Emits a single <see cref="Instruction.ImageStore"/> operation for the current image store opcode.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operation</param>
  public static void Sust(EmitterContext context)
  {
      OpCodeImage op = (OpCodeImage)context.CurrOp;

      SamplerType type = ConvertSamplerType(op.Dimensions);

      if (type == SamplerType.None)
      {
          context.Config.GpuAccessor.Log("Invalid image store sampler type.");

          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Both readers walk consecutive registers and yield constant 0
      // once their index has moved past the zero register.
      Operand Ra() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand Rb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      List<Operand> operands = new List<Operand>();

      if (op.IsBindless)
      {
          // Extra leading source read from Rc.
          operands.Add(context.Copy(Register(op.Rc)));
      }

      // Coordinates come from consecutive Ra registers.
      for (int remaining = type.GetDimensions(); remaining > 0; remaining--)
      {
          operands.Add(Ra());
      }

      if (Sample1DAs2D && (type & SamplerType.Mask) == SamplerType.Texture1D)
      {
          operands.Add(Const(0));

          type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
      }

      if ((type & SamplerType.Array) == SamplerType.Array)
      {
          operands.Add(Ra());

          type |= SamplerType.Array;
      }

      TextureFormat format;

      if (!op.UseComponents)
      {
          if (op.ByteAddress)
          {
              int xIndex = op.IsBindless ? 1 : 0;

              operands[xIndex] = context.ShiftRightS32(operands[xIndex], Const(GetComponentSizeInBytesLog2(op.Size)));
          }

          // One value register per component of the store size.
          for (int remaining = GetComponents(op.Size); remaining > 0; remaining--)
          {
              operands.Add(Rb());
          }

          format = GetTextureFormat(op.Size);
      }
      else
      {
          // One value register per bit set in the component mask.
          for (int mask = (int)op.Components; mask != 0; mask >>= 1)
          {
              if ((mask & 1) != 0)
              {
                  operands.Add(Rb());
              }
          }

          format = op.IsBindless
              ? TextureFormat.Unknown
              : context.Config.GetTextureFormat(op.HandleOffset);
      }

      Operand[] sources = operands.ToArray();

      int handle = op.IsBindless ? 0 : op.HandleOffset;

      TextureFlags flags = op.IsBindless ? TextureFlags.Bindless : TextureFlags.None;

      context.Add(context.CreateTextureOperation(
          Instruction.ImageStore,
          type,
          format,
          flags,
          handle,
          0,
          null,
          sources));
  }
  /// <summary>
  /// Emits a texture sample with no extra texture flags.
  /// </summary>
  /// <param name="context">Emitter context for the current opcode</param>
  public static void Tex(EmitterContext context) => EmitTextureSample(context, TextureFlags.None);
  /// <summary>
  /// Emits a texture sample with the bindless flag set.
  /// </summary>
  /// <param name="context">Emitter context for the current opcode</param>
  public static void TexB(EmitterContext context) => EmitTextureSample(context, TextureFlags.Bindless);
  /// <summary>
  /// Emits a texture sample that uses integer coordinates, and marks integer sampling as used.
  /// </summary>
  /// <param name="context">Emitter context for the current opcode</param>
  public static void Tld(EmitterContext context)
  {
      const TextureFlags SampleFlags = TextureFlags.IntCoords;

      context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

      EmitTextureSample(context, SampleFlags);
  }
  /// <summary>
  /// Emits a bindless texture sample that uses integer coordinates, and marks integer sampling as used.
  /// </summary>
  /// <param name="context">Emitter context for the current opcode</param>
  public static void TldB(EmitterContext context)
  {
      const TextureFlags SampleFlags = TextureFlags.IntCoords | TextureFlags.Bindless;

      context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

      EmitTextureSample(context, SampleFlags);
  }
  /// <summary>
  /// Emits the texture operations for the scalar texture opcodes
  /// (<c>OpCodeTexs</c>, <c>OpCodeTlds</c> and <c>OpCodeTld4s</c>).
  /// </summary>
  /// <remarks>
  /// The source operands are gathered from consecutive Ra/Rb registers in an order that depends on
  /// the opcode target, then one <see cref="Instruction.TextureSample"/> is emitted per enabled component.
  /// </remarks>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  /// <exception cref="InvalidOperationException">The current opcode is none of the three supported types</exception>
  public static void Texs(EmitterContext context)
  {
      OpCodeTextureScalar op = (OpCodeTextureScalar)context.CurrOp;

      // Nothing is written when both destinations are the zero register.
      if (op.Rd0.IsRZ && op.Rd1.IsRZ)
      {
          return;
      }

      List<Operand> operands = new List<Operand>();

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Both readers walk consecutive registers and yield constant 0
      // once their index has moved past the zero register.
      Operand Ra() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand Rb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      // Appends the operands in argument order (arguments are evaluated left to right).
      void Push(params Operand[] items) => operands.AddRange(items);

      // Unpacks one signed offset per coordinate from the next Rb register.
      void AddTextureOffset(int coordsCount, int stride, int size)
      {
          Operand packed = Rb();

          for (int coord = 0; coord < coordsCount; coord++)
          {
              operands.Add(context.BitfieldExtractS32(packed, Const(coord * stride), Const(size)));
          }
      }

      SamplerType type;
      TextureFlags flags;

      if (op is OpCodeTexs texsOp)
      {
          type = ConvertSamplerType(texsOp.Target);

          if (type == SamplerType.None)
          {
              context.Config.GpuAccessor.Log("Invalid texture sampler type.");

              return;
          }

          flags = ConvertTextureFlags(texsOp.Target);

          // 1D -> Buffer conversions need no handling here, since only
          // texture sample with integer coordinates can ever use buffer targets.
          if ((type & SamplerType.Array) == 0)
          {
              switch (texsOp.Target)
              {
                  case TextureTarget.Texture1DLodZero:
                      Push(Ra());

                      if (Sample1DAs2D)
                      {
                          Push(ConstF(0));

                          type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                      }

                      Push(ConstF(0));
                      break;

                  case TextureTarget.Texture2D:
                      Push(Ra(), Rb());
                      break;

                  case TextureTarget.Texture2DLodZero:
                      Push(Ra(), Rb(), ConstF(0));
                      break;

                  case TextureTarget.Texture2DLodLevel:
                  case TextureTarget.Texture2DDepthCompare:
                  case TextureTarget.Texture3D:
                  case TextureTarget.TextureCube:
                      Push(Ra(), Ra(), Rb());
                      break;

                  case TextureTarget.Texture2DLodZeroDepthCompare:
                  case TextureTarget.Texture3DLodZero:
                      Push(Ra(), Ra(), Rb(), ConstF(0));
                      break;

                  case TextureTarget.Texture2DLodLevelDepthCompare:
                  case TextureTarget.TextureCubeLodLevel:
                      Push(Ra(), Ra(), Rb(), Rb());
                      break;
              }
          }
          else
          {
              // The array index is read first but placed after the coordinates.
              Operand arrayIndex = Ra();

              Push(Ra(), Rb(), arrayIndex);

              if ((type & SamplerType.Shadow) != 0)
              {
                  Push(Rb());
              }

              if ((flags & TextureFlags.LodLevel) != 0)
              {
                  Push(ConstF(0));
              }
          }
      }
      else if (op is OpCodeTlds tldsOp)
      {
          type = ConvertSamplerType(tldsOp.Target);

          if (type == SamplerType.None)
          {
              context.Config.GpuAccessor.Log("Invalid texel fetch sampler type.");

              return;
          }

          context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

          flags = ConvertTextureFlags(tldsOp.Target) | TextureFlags.IntCoords;

          bool isBuffer = tldsOp.Target == TexelLoadTarget.Texture1DLodZero &&
                          context.Config.GpuAccessor.QueryIsTextureBuffer(tldsOp.HandleOffset);

          if (isBuffer)
          {
              type = SamplerType.TextureBuffer;
              flags &= ~TextureFlags.LodLevel;
          }

          switch (tldsOp.Target)
          {
              case TexelLoadTarget.Texture1DLodZero:
                  Push(Ra());

                  if (type != SamplerType.TextureBuffer)
                  {
                      if (Sample1DAs2D)
                      {
                          Push(ConstF(0));

                          type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                      }

                      Push(ConstF(0));
                  }
                  break;

              case TexelLoadTarget.Texture1DLodLevel:
                  Push(Ra());

                  if (Sample1DAs2D)
                  {
                      Push(ConstF(0));

                      type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                  }

                  Push(Rb());
                  break;

              case TexelLoadTarget.Texture2DLodZero:
                  Push(Ra(), Rb(), Const(0));
                  break;

              case TexelLoadTarget.Texture2DLodZeroOffset:
                  Push(Ra(), Ra(), Const(0));
                  break;

              case TexelLoadTarget.Texture2DLodZeroMultisample:
              case TexelLoadTarget.Texture2DLodLevel:
              case TexelLoadTarget.Texture2DLodLevelOffset:
                  Push(Ra(), Ra(), Rb());
                  break;

              case TexelLoadTarget.Texture3DLodZero:
                  Push(Ra(), Ra(), Rb(), Const(0));
                  break;

              case TexelLoadTarget.Texture2DArrayLodZero:
                  Push(Rb(), Rb(), Ra(), Const(0));
                  break;
          }

          if ((flags & TextureFlags.Offset) != 0)
          {
              AddTextureOffset(type.GetDimensions(), 4, 4);
          }
      }
      else if (op is OpCodeTld4s tld4sOp)
      {
          // The second coordinate comes from Rb only when Rb is not needed for anything else.
          if (tld4sOp.HasDepthCompare || tld4sOp.HasOffset)
          {
              Push(Ra(), Ra());
          }
          else
          {
              Push(Ra(), Rb());
          }

          type = SamplerType.Texture2D;
          flags = TextureFlags.Gather;

          if (tld4sOp.HasDepthCompare)
          {
              Push(Rb());

              type |= SamplerType.Shadow;
          }

          if (tld4sOp.HasOffset)
          {
              AddTextureOffset(type.GetDimensions(), 8, 6);

              flags |= TextureFlags.Offset;
          }

          Push(Const(tld4sOp.GatherCompIndex));
      }
      else
      {
          throw new InvalidOperationException($"Invalid opcode type \"{op.GetType().Name}\".");
      }

      Operand[] sources = operands.ToArray();

      // Half-precision results are collected here and packed at the end.
      Operand[] rd0 = { ConstF(0), ConstF(0) };
      Operand[] rd1 = { ConstF(0), ConstF(0) };

      int destIncrement = 0;

      // Picks the destination for the next enabled component: the first two go to Rd0, later ones to Rd1.
      Operand GetDest()
      {
          int slot = destIncrement++;

          bool useSecond = (slot >> 1) != 0;
          int lane = slot & 1;

          if (op.IsFp16)
          {
              Operand temp = Local();

              if (useSecond)
              {
                  rd1[lane] = temp;
              }
              else
              {
                  rd0[lane] = temp;
              }

              return temp;
          }

          int rdIndex = useSecond ? op.Rd1.Index : op.Rd0.Index;

          if (rdIndex < RegisterConsts.RegisterZeroIndex)
          {
              rdIndex += lane;
          }

          return Register(rdIndex, RegisterType.Gpr);
      }

      int handle = op.HandleOffset;
      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; component++, pending >>= 1)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = GetDest();

          context.Add(context.CreateTextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }

      if (op.IsFp16)
      {
          context.Copy(Register(op.Rd0), context.PackHalf2x16(rd0[0], rd0[1]));
          context.Copy(Register(op.Rd1), context.PackHalf2x16(rd1[0], rd1[1]));
      }
  }
  /// <summary>
  /// Emits the texture gather operations for the current TLD4 opcode,
  /// one <see cref="Instruction.TextureSample"/> per enabled component.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  public static void Tld4(EmitterContext context)
  {
      IOpCodeTld4 op = (IOpCodeTld4)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Both readers walk consecutive registers and yield constant 0
      // once their index has moved past the zero register.
      Operand Ra() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand Rb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      // The array index is read before anything else, but appended after the coordinates.
      Operand arrayIndex = op.IsArray ? Ra() : null;

      List<Operand> operands = new List<Operand>();

      SamplerType type = ConvertSamplerType(op.Dimensions);

      TextureFlags flags = TextureFlags.Gather;

      if (op.Bindless)
      {
          operands.Add(Rb());

          flags |= TextureFlags.Bindless;
      }

      int coordsCount = type.GetDimensions();

      for (int coord = 0; coord < coordsCount; coord++)
      {
          operands.Add(Ra());
      }

      bool is1DTo2D = Sample1DAs2D && type == SamplerType.Texture1D;

      if (is1DTo2D)
      {
          operands.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      if (op.IsArray)
      {
          operands.Add(arrayIndex);

          type |= SamplerType.Array;
      }

      bool hasOffset = op.Offset != TextureGatherOffset.None;
      bool hasOffsets = op.Offset == TextureGatherOffset.Offsets;

      // Packed offsets are read before the depth compare value.
      Operand packedLow = hasOffset ? Rb() : null;
      Operand packedHigh = hasOffsets ? Rb() : null;

      if (op.HasDepthCompare)
      {
          operands.Add(Rb());

          type |= SamplerType.Shadow;
      }

      if (hasOffset)
      {
          int offsetTexelsCount = hasOffsets ? 4 : 1;
          int totalOffsets = coordsCount * offsetTexelsCount;

          for (int item = 0; item < totalOffsets; item++)
          {
              // Four 6-bit fields per register, at 8-bit intervals.
              Operand packed = ((item >> 2) & 1) != 0 ? packedHigh : packedLow;

              operands.Add(context.BitfieldExtractS32(packed, Const((item & 3) * 8), Const(6)));
          }

          if (is1DTo2D)
          {
              for (int texel = 0; texel < offsetTexelsCount; texel++)
              {
                  operands.Add(Const(0));
              }
          }

          flags |= hasOffsets ? TextureFlags.Offsets : TextureFlags.Offset;
      }

      operands.Add(Const(op.GatherCompIndex));

      Operand[] sources = operands.ToArray();

      int nextRd = op.Rd.Index;

      // Hands out consecutive destination registers.
      Operand GetDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      int handle = op.HandleOffset;
      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; component++, pending >>= 1)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = GetDest();

          context.Add(context.CreateTextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>
  /// Emits the texture mip map level query in its bindless form.
  /// </summary>
  /// <param name="context">Emitter context for the current opcode</param>
  public static void TmmlB(EmitterContext context) => EmitTextureMipMapLevel(context, isBindless: true);
  /// <summary>
  /// Emits the texture mip map level query in its non-bindless form.
  /// </summary>
  /// <param name="context">Emitter context for the current opcode</param>
  public static void Tmml(EmitterContext context) => EmitTextureMipMapLevel(context, isBindless: false);
  /// <summary>
  /// Emits <see cref="Instruction.Lod"/> operations for the current opcode and stores each result,
  /// multiplied by 256 and converted to a signed integer, in the destination registers.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  /// <param name="isBindless">True to read an extra leading source from Rb and flag the operation as bindless</param>
  private static void EmitTextureMipMapLevel(EmitterContext context, bool isBindless)
  {
      OpCodeTexture op = (OpCodeTexture)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Both readers walk consecutive registers and yield constant 0
      // once their index has moved past the zero register.
      Operand Ra() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand Rb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      List<Operand> operands = new List<Operand>();

      TextureFlags flags = TextureFlags.None;

      if (isBindless)
      {
          operands.Add(Rb());

          flags |= TextureFlags.Bindless;
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      int coordsCount = type.GetDimensions();

      // The array index is read ahead of the coordinates, but appended after them.
      Operand arrayIndex = op.IsArray ? Ra() : null;

      for (int coord = 0; coord < coordsCount; coord++)
      {
          operands.Add(Ra());
      }

      if (Sample1DAs2D && type == SamplerType.Texture1D)
      {
          operands.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      if (op.IsArray)
      {
          operands.Add(arrayIndex);

          type |= SamplerType.Array;
      }

      Operand[] sources = operands.ToArray();

      int nextRd = op.Rd.Index;

      // Hands out consecutive destination registers.
      Operand GetDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      int handle = isBindless ? 0 : op.HandleOffset;
      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; component++, pending >>= 1)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = GetDest();

          if (component < 2)
          {
              Operand lod = Local();

              context.Add(context.CreateTextureOperation(
                  Instruction.Lod,
                  type,
                  flags,
                  handle,
                  component ^ 1, // The instruction component order is the inverse of GLSL's.
                  lod,
                  sources));

              Operand scaled = context.FPMultiply(lod, ConstF(256.0f));

              context.Copy(dest, context.FPConvertToS32(scaled));
          }
          else
          {
              // Components z and w aren't standard: leave a comment and return 0 for them.
              context.Add(new CommentNode("Unsupported component z or w found"));
              context.Copy(dest, Const(0));
          }
      }
  }
  /// <summary>
  /// Emits texture sample operations that carry explicit derivatives for the current TXD opcode,
  /// one <see cref="Instruction.TextureSample"/> per enabled component.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  public static void Txd(EmitterContext context)
  {
      OpCodeTxd op = (OpCodeTxd)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Both readers walk consecutive registers and yield constant 0
      // once their index has moved past the zero register.
      Operand Ra() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand Rb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      List<Operand> operands = new List<Operand>();

      TextureFlags flags = TextureFlags.Derivatives;

      if (op.IsBindless)
      {
          // Here the extra leading source comes from Ra.
          operands.Add(Ra());

          flags |= TextureFlags.Bindless;
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      int coordsCount = type.GetDimensions();

      for (int coord = 0; coord < coordsCount; coord++)
      {
          operands.Add(Ra());
      }

      bool is1DTo2D = Sample1DAs2D && type == SamplerType.Texture1D;

      if (is1DTo2D)
      {
          operands.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      // Always read; the low 16 bits feed the array index and bits 16 and up feed the offsets.
      Operand packedParams = Ra();

      if (op.IsArray)
      {
          operands.Add(context.BitwiseAnd(packedParams, Const(0xffff)));

          type |= SamplerType.Array;
      }

      // Derivatives (X and Y), padded with 0 when a 1D access was promoted to 2D.
      int derivativesCount = 2 * coordsCount;

      for (int derivative = 0; derivative < derivativesCount; derivative++)
      {
          operands.Add(Rb());

          if (is1DTo2D)
          {
              operands.Add(ConstF(0));
          }
      }

      if (op.HasOffset)
      {
          for (int coord = 0; coord < coordsCount; coord++)
          {
              operands.Add(context.BitfieldExtractS32(packedParams, Const(16 + coord * 4), Const(4)));
          }

          if (is1DTo2D)
          {
              operands.Add(Const(0));
          }

          flags |= TextureFlags.Offset;
      }

      Operand[] sources = operands.ToArray();

      int nextRd = op.Rd.Index;

      // Hands out consecutive destination registers.
      Operand GetDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      int handle = op.IsBindless ? 0 : op.HandleOffset;
      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; component++, pending >>= 1)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = GetDest();

          context.Add(context.CreateTextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>
  /// Emits the texture query in its non-bindless form.
  /// </summary>
  /// <param name="context">Emitter context for the current opcode</param>
  public static void Txq(EmitterContext context) => EmitTextureQuery(context, false);
  /// <summary>
  /// Emits the texture query in its bindless form.
  /// </summary>
  /// <param name="context">Emitter context for the current opcode</param>
  public static void TxqB(EmitterContext context) => EmitTextureQuery(context, true);
  /// <summary>
  /// Emits <see cref="Instruction.TextureSize"/> operations for the current opcode,
  /// one per enabled component.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  /// <param name="bindless">True to read an extra leading source from Ra and flag the operation as bindless</param>
  private static void EmitTextureQuery(EmitterContext context, bool bindless)
  {
      OpCodeTex op = (OpCodeTex)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

      TextureProperty property = (TextureProperty)op.RawOpCode.Extract(22, 6);

      // TODO: Validate and use property.
      // Until then, every query is emitted as a 2D texture size query.
      Instruction inst = Instruction.TextureSize;

      SamplerType type = SamplerType.Texture2D;

      TextureFlags flags = bindless ? TextureFlags.Bindless : TextureFlags.None;

      int nextRa = op.Ra.Index;

      // Walks consecutive registers and yields constant 0 once the index has moved past the zero register.
      Operand Ra() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      List<Operand> operands = new List<Operand>();

      if (bindless)
      {
          operands.Add(Ra());
      }

      operands.Add(Ra());

      Operand[] sources = operands.ToArray();

      int nextRd = op.Rd.Index;

      // Hands out consecutive destination registers.
      Operand GetDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      int handle = bindless ? 0 : op.HandleOffset;
      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; component++, pending >>= 1)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = GetDest();

          context.Add(context.CreateTextureOperation(
              inst,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>
  /// Emits the texture sample operations for the current texture instruction,
  /// one operation per bit set on the instruction component mask.
  /// </summary>
  /// <remarks>
  /// Operands are read from consecutive registers starting at Ra and Rb, and every read
  /// advances the matching register index. Because of that, the order of the Ra() and Rb()
  /// calls in this method is significant and must be preserved.
  /// </remarks>
  /// <param name="context">Emitter context holding the current opcode, and where the operations are added</param>
  /// <param name="flags">Base texture flags; LodLevel, LodBias and Offset are added here as needed</param>
  private static void EmitTextureSample(EmitterContext context, TextureFlags flags)
  {
      OpCodeTexture op = (OpCodeTexture)context.CurrOp;

      // Nothing is emitted when the destination register is RZ.
      if (op.Rd.IsRZ)
      {
          return;
      }

      bool isBindless = (flags & TextureFlags.Bindless) != 0;

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Returns a copy of the next register of the Ra sequence,
      // or a zero constant once the index went past the zero register index.
      Operand Ra()
      {
          if (nextRa <= RegisterConsts.RegisterZeroIndex)
          {
              return context.Copy(Register(nextRa++, RegisterType.Gpr));
          }

          return Const(0);
      }

      // Same as Ra(), but for the register sequence starting at Rb.
      Operand Rb()
      {
          if (nextRb <= RegisterConsts.RegisterZeroIndex)
          {
              return context.Copy(Register(nextRb++, RegisterType.Gpr));
          }

          return Const(0);
      }

      // The array index is the first value read from Ra, before any coordinate.
      Operand arrayIndex = null;

      if (op.IsArray)
      {
          arrayIndex = Ra();
      }

      var operands = new List<Operand>();

      // On bindless mode, the first source comes from Rb.
      if (isBindless)
      {
          operands.Add(Rb());
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      TextureLodMode lodMode = op.LodMode;

      bool hasLod = lodMode > TextureLodMode.LodZero;

      bool isPlainIntCoords1D =
          type == SamplerType.Texture1D &&
          (flags & ~TextureFlags.Bindless) == TextureFlags.IntCoords &&
          !hasLod &&
          !op.HasDepthCompare &&
          !op.HasOffset &&
          !op.IsArray &&
          !op.IsMultisample;

      // With bindless there is no way to know the texture type, so a 1D sampler
      // is assumed to be a texture buffer, as that is the more common case.
      // Otherwise, the GPU accessor is queried using the handle offset.
      if (isPlainIntCoords1D &&
          (isBindless || context.Config.GpuAccessor.QueryIsTextureBuffer(op.HandleOffset)))
      {
          type = SamplerType.TextureBuffer;
      }

      int coordsCount = type.GetDimensions();

      // One Ra read per coordinate.
      for (int remaining = coordsCount; remaining > 0; remaining--)
      {
          operands.Add(Ra());
      }

      // When enabled, 1D textures are sampled as 2D with a constant zero as second coordinate.
      if (Sample1DAs2D && type == SamplerType.Texture1D)
      {
          operands.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      if (op.IsArray)
      {
          operands.Add(arrayIndex);

          type |= SamplerType.Array;
      }

      // Rb reads happen in this order: LOD value, packed offsets,
      // depth compare value and, at the end, the multisample operand.
      Operand lodValue;

      if (hasLod)
      {
          lodValue = Rb();
      }
      else
      {
          lodValue = ConstF(0);
      }

      Operand packedOffs = null;

      if (op.HasOffset)
      {
          packedOffs = Rb();
      }

      if (op.HasDepthCompare)
      {
          operands.Add(Rb());

          type |= SamplerType.Shadow;
      }

      bool usesLodLevel =
          lodMode == TextureLodMode.LodZero ||
          lodMode == TextureLodMode.LodLevel ||
          lodMode == TextureLodMode.LodLevelA;

      // The LOD level source is not added for multisample or texture buffer samplers.
      if (usesLodLevel && !op.IsMultisample && type != SamplerType.TextureBuffer)
      {
          operands.Add(lodValue);

          flags |= TextureFlags.LodLevel;
      }

      if (op.HasOffset)
      {
          // One offset per coordinate, extracted from the packed value with
          // BitfieldExtractS32 using the arguments (4 * n, 4).
          for (int coord = 0; coord < coordsCount; coord++)
          {
              Operand fieldStart = Const(coord * 4);
              Operand fieldSize = Const(4);

              operands.Add(context.BitfieldExtractS32(packedOffs, fieldStart, fieldSize));
          }

          flags |= TextureFlags.Offset;
      }

      bool usesLodBias =
          lodMode == TextureLodMode.LodBias ||
          lodMode == TextureLodMode.LodBiasA;

      if (usesLodBias)
      {
          operands.Add(lodValue);

          flags |= TextureFlags.LodBias;
      }

      if (op.IsMultisample)
      {
          operands.Add(Rb());

          type |= SamplerType.Multisample;
      }

      Operand[] sources = operands.ToArray();

      int nextRd = op.Rd.Index;

      // Returns the next destination register of the sequence starting at Rd,
      // or a zero constant once the index went past the zero register index.
      Operand GetDest()
      {
          if (nextRd <= RegisterConsts.RegisterZeroIndex)
          {
              return Register(nextRd++, RegisterType.Gpr);
          }

          return Const(0);
      }

      // Bindless operations do not use the handle offset of the instruction.
      int handle = isBindless ? 0 : op.HandleOffset;

      int pendingMask = op.ComponentMask;

      for (int component = 0; pendingMask != 0; component++, pendingMask >>= 1)
      {
          // Components that are not on the mask do not consume a destination register.
          if ((pendingMask & 1) == 0)
          {
              continue;
          }

          Operand dest = GetDest();

          TextureOperation operation = context.CreateTextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources);

          context.Add(operation);
      }
  }
  /// <summary>
  /// Gets the number of components used for a given integer size.
  /// </summary>
  /// <param name="size">Integer size</param>
  /// <returns>2 for B64, 4 for B128 and UB128, 1 for all other sizes</returns>
  private static int GetComponents(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.B64:
              return 2;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return 4;

          default:
              return 1;
      }
  }
  /// <summary>
  /// Gets the base 2 logarithm of the size in bytes associated with a given integer size.
  /// </summary>
  /// <param name="size">Integer size</param>
  /// <returns>
  /// 0 for the 8-bit sizes, 1 for the 16-bit sizes, 2 for B32, 3 for B64,
  /// 4 for B128 and UB128, and 2 for any other size
  /// </returns>
  private static int GetComponentSizeInBytesLog2(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.U8:
          case IntegerSize.S8:
              return 0;

          case IntegerSize.U16:
          case IntegerSize.S16:
              return 1;

          case IntegerSize.B32:
              return 2;

          case IntegerSize.B64:
              return 3;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return 4;

          default:
              // Unlisted sizes use the same value as B32.
              return 2;
      }
  }
  /// <summary>
  /// Gets the unsigned or signed integer texture format that matches a given integer size.
  /// </summary>
  /// <param name="size">Integer size</param>
  /// <returns>Texture format for the size, or R32Uint for sizes that are not listed</returns>
  private static TextureFormat GetTextureFormat(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.U8:
              return TextureFormat.R8Uint;

          case IntegerSize.S8:
              return TextureFormat.R8Sint;

          case IntegerSize.U16:
              return TextureFormat.R16Uint;

          case IntegerSize.S16:
              return TextureFormat.R16Sint;

          case IntegerSize.B32:
              return TextureFormat.R32Uint;

          case IntegerSize.B64:
              return TextureFormat.R32G32Uint;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return TextureFormat.R32G32B32A32Uint;

          default:
              // Unlisted sizes use the same format as B32.
              return TextureFormat.R32Uint;
      }
  }
  /// <summary>
  /// Converts image dimensions into the matching sampler type.
  /// </summary>
  /// <param name="target">Image dimensions</param>
  /// <returns>Sampler type for the dimensions, or None for dimensions that are not listed</returns>
  private static SamplerType ConvertSamplerType(ImageDimensions target)
  {
      switch (target)
      {
          case ImageDimensions.Image1D:
              return SamplerType.Texture1D;

          case ImageDimensions.ImageBuffer:
              return SamplerType.TextureBuffer;

          case ImageDimensions.Image1DArray:
              return SamplerType.Texture1D | SamplerType.Array;

          case ImageDimensions.Image2D:
              return SamplerType.Texture2D;

          case ImageDimensions.Image2DArray:
              return SamplerType.Texture2D | SamplerType.Array;

          case ImageDimensions.Image3D:
              return SamplerType.Texture3D;

          default:
              return SamplerType.None;
      }
  }
  /// <summary>
  /// Converts texture dimensions into the matching sampler type.
  /// </summary>
  /// <param name="dimensions">Texture dimensions</param>
  /// <returns>Sampler type for the dimensions</returns>
  /// <exception cref="ArgumentException">Thrown when <paramref name="dimensions"/> is not 1D, 2D, 3D or cube</exception>
  private static SamplerType ConvertSamplerType(TextureDimensions dimensions)
  {
      switch (dimensions)
      {
          case TextureDimensions.Texture1D:
              return SamplerType.Texture1D;

          case TextureDimensions.Texture2D:
              return SamplerType.Texture2D;

          case TextureDimensions.Texture3D:
              return SamplerType.Texture3D;

          case TextureDimensions.TextureCube:
              return SamplerType.TextureCube;

          default:
              throw new ArgumentException($"Invalid texture dimensions \"{dimensions}\".");
      }
  }
  /// <summary>
  /// Converts a texture target into the matching sampler type.
  /// The LOD part of the target has no effect on the result, only the dimensions,
  /// the array-ness and the depth compare part are reflected on the sampler type.
  /// </summary>
  /// <param name="type">Texture target</param>
  /// <returns>Sampler type for the target, or None for targets that are not listed</returns>
  private static SamplerType ConvertSamplerType(TextureTarget type)
  {
      return type switch
      {
          TextureTarget.Texture1DLodZero => SamplerType.Texture1D,

          TextureTarget.Texture2D => SamplerType.Texture2D,
          TextureTarget.Texture2DLodZero => SamplerType.Texture2D,
          TextureTarget.Texture2DLodLevel => SamplerType.Texture2D,

          TextureTarget.Texture2DDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,
          TextureTarget.Texture2DLodLevelDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,
          TextureTarget.Texture2DLodZeroDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,

          TextureTarget.Texture2DArray => SamplerType.Texture2D | SamplerType.Array,
          TextureTarget.Texture2DArrayLodZero => SamplerType.Texture2D | SamplerType.Array,

          TextureTarget.Texture2DArrayLodZeroDepthCompare =>
              SamplerType.Texture2D | SamplerType.Array | SamplerType.Shadow,

          TextureTarget.Texture3D => SamplerType.Texture3D,
          TextureTarget.Texture3DLodZero => SamplerType.Texture3D,

          TextureTarget.TextureCube => SamplerType.TextureCube,
          TextureTarget.TextureCubeLodLevel => SamplerType.TextureCube,

          _ => SamplerType.None
      };
  }
  /// <summary>
  /// Converts a texel load target into the matching sampler type.
  /// The LOD and offset parts of the target have no effect on the result.
  /// </summary>
  /// <param name="type">Texel load target</param>
  /// <returns>Sampler type for the target, or None for targets that are not listed</returns>
  private static SamplerType ConvertSamplerType(TexelLoadTarget type)
  {
      return type switch
      {
          TexelLoadTarget.Texture1DLodZero => SamplerType.Texture1D,
          TexelLoadTarget.Texture1DLodLevel => SamplerType.Texture1D,

          TexelLoadTarget.Texture2DLodZero => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodZeroOffset => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodLevel => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodLevelOffset => SamplerType.Texture2D,

          TexelLoadTarget.Texture2DLodZeroMultisample => SamplerType.Texture2D | SamplerType.Multisample,

          TexelLoadTarget.Texture3DLodZero => SamplerType.Texture3D,

          TexelLoadTarget.Texture2DArrayLodZero => SamplerType.Texture2D | SamplerType.Array,

          _ => SamplerType.None
      };
  }
  /// <summary>
  /// Gets the texture flags implied by a texture target.
  /// </summary>
  /// <param name="type">Texture target</param>
  /// <returns>LodLevel for the targets listed below, None for every other target</returns>
  private static TextureFlags ConvertTextureFlags(TextureTarget type)
  {
      return type switch
      {
          TextureTarget.Texture1DLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodLevel => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodLevelDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodZeroDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture2DArrayLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DArrayLodZeroDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture3DLodZero => TextureFlags.LodLevel,
          TextureTarget.TextureCubeLodLevel => TextureFlags.LodLevel,

          // Texture2D, Texture2DDepthCompare, Texture2DArray, Texture3D and TextureCube
          // have no flags, the same as any target that is not listed here.
          _ => TextureFlags.None
      };
  }
  /// <summary>
  /// Gets the texture flags implied by a texel load target.
  /// </summary>
  /// <param name="type">Texel load target</param>
  /// <returns>
  /// LodLevel for the listed targets, with Offset also set for the offset variants,
  /// or None for targets that are not listed
  /// </returns>
  private static TextureFlags ConvertTextureFlags(TexelLoadTarget type)
  {
      return type switch
      {
          TexelLoadTarget.Texture1DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture1DLodLevel => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodLevel => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodZeroMultisample => TextureFlags.LodLevel,
          TexelLoadTarget.Texture3DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DArrayLodZero => TextureFlags.LodLevel,

          TexelLoadTarget.Texture2DLodZeroOffset => TextureFlags.LodLevel | TextureFlags.Offset,
          TexelLoadTarget.Texture2DLodLevelOffset => TextureFlags.LodLevel | TextureFlags.Offset,

          _ => TextureFlags.None
      };
  }
  1140. }
  1141. }