InstEmitTexture.cs 45 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471
  1. using Ryujinx.Graphics.Shader.Decoders;
  2. using Ryujinx.Graphics.Shader.IntermediateRepresentation;
  3. using Ryujinx.Graphics.Shader.Translation;
  4. using System;
  5. using System.Collections.Generic;
  6. using static Ryujinx.Graphics.Shader.Instructions.InstEmitHelper;
  7. using static Ryujinx.Graphics.Shader.IntermediateRepresentation.OperandHelper;
  8. namespace Ryujinx.Graphics.Shader.Instructions
  9. {
  10. static partial class InstEmit
  11. {
  // When set, the emitters in this file turn 1D texture/image accesses into 2D ones:
  // a constant zero is appended as the second coordinate and the sampler type is
  // switched to Texture2D.
  12. private const bool Sample1DAs2D = true;
  /// <summary>
  /// Emits the IR for the SULD (image load) instruction: one <see cref="Instruction.ImageLoad"/>
  /// texture operation is added for every destination register that is written.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  public static void Suld(EmitterContext context)
  {
      OpCodeImage op = (OpCodeImage)context.CurrOp;

      SamplerType type = ConvertSamplerType(op.Dimensions);

      if (type == SamplerType.None)
      {
          // This instruction loads from the image; the message used to say "store".
          context.Config.GpuAccessor.Log("Invalid image load sampler type.");

          return;
      }

      // Rb is Rd on the SULD instruction.
      int rdIndex = op.Rb.Index;
      int raIndex = op.Ra.Index;

      // Returns a copy of the next register in the Ra sequence, or constant 0
      // once the sequence has moved past the zero register.
      Operand Ra()
      {
          if (raIndex > RegisterConsts.RegisterZeroIndex)
          {
              return Const(0);
          }

          return context.Copy(Register(raIndex++, RegisterType.Gpr));
      }

      List<Operand> sourcesList = new List<Operand>();

      // For bindless accesses the first source comes from Rc.
      if (op.IsBindless)
      {
          sourcesList.Add(context.Copy(Register(op.Rc)));
      }

      int coordsCount = type.GetDimensions();

      for (int index = 0; index < coordsCount; index++)
      {
          sourcesList.Add(Ra());
      }

      if (Sample1DAs2D && (type & SamplerType.Mask) == SamplerType.Texture1D)
      {
          // Access the 1D image as 2D, with a zero second coordinate.
          sourcesList.Add(Const(0));

          type &= ~SamplerType.Mask;
          type |= SamplerType.Texture2D;
      }

      if (type.HasFlag(SamplerType.Array))
      {
          // One extra Ra register is consumed for array images.
          // The Array flag is already set on the type here, so it is not set again.
          sourcesList.Add(Ra());
      }

      Operand[] sources = sourcesList.ToArray();

      int handle = !op.IsBindless ? op.Immediate : 0;

      TextureFlags flags = op.IsBindless ? TextureFlags.Bindless : TextureFlags.None;

      if (op.UseComponents)
      {
          int componentMask = (int)op.Components;

          for (int compMask = componentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
          {
              if ((compMask & 1) == 0)
              {
                  continue;
              }

              // Stop once the destination sequence reaches the zero register.
              if (rdIndex == RegisterConsts.RegisterZeroIndex)
              {
                  break;
              }

              Operand rd = Register(rdIndex++, RegisterType.Gpr);

              TextureOperation operation = new TextureOperation(
                  Instruction.ImageLoad,
                  type,
                  flags,
                  handle,
                  compIndex,
                  rd,
                  sources);

              // The format is only looked up by handle for non-bindless accesses.
              if (!op.IsBindless)
              {
                  operation.Format = context.Config.GetTextureFormat(handle);
              }

              context.Add(operation);
          }
      }
      else
      {
          if (op.ByteAddress)
          {
              // The X coordinate follows the bindless handle source when one is present.
              int xIndex = op.IsBindless ? 1 : 0;

              sources[xIndex] = context.ShiftRightS32(sources[xIndex], Const(GetComponentSizeInBytesLog2(op.Size)));
          }

          int components = GetComponents(op.Size);

          for (int compIndex = 0; compIndex < components; compIndex++)
          {
              // Stop once the destination sequence reaches the zero register.
              if (rdIndex == RegisterConsts.RegisterZeroIndex)
              {
                  break;
              }

              Operand rd = Register(rdIndex++, RegisterType.Gpr);

              TextureOperation operation = new TextureOperation(
                  Instruction.ImageLoad,
                  type,
                  flags,
                  handle,
                  compIndex,
                  rd,
                  sources)
              {
                  Format = GetTextureFormat(op.Size)
              };

              context.Add(operation);

              // 8 and 16 bit sizes are zero or sign extended to 32 bits in the destination.
              switch (op.Size)
              {
                  case IntegerSize.U8: context.Copy(rd, ZeroExtendTo32(context, rd, 8)); break;
                  case IntegerSize.U16: context.Copy(rd, ZeroExtendTo32(context, rd, 16)); break;
                  case IntegerSize.S8: context.Copy(rd, SignExtendTo32(context, rd, 8)); break;
                  case IntegerSize.S16: context.Copy(rd, SignExtendTo32(context, rd, 16)); break;
              }
          }
      }
  }
  /// <summary>
  /// Emits the IR for the SUST (image store) instruction as a single
  /// <see cref="Instruction.ImageStore"/> texture operation without destination.
  /// Sources are, in order: the bindless handle (if any), the coordinates taken from the
  /// Ra sequence, and the values to store taken from the Rb sequence.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operation</param>
  public static void Sust(EmitterContext context)
  {
      OpCodeImage imageOp = (OpCodeImage)context.CurrOp;

      SamplerType samplerType = ConvertSamplerType(imageOp.Dimensions);

      if (samplerType == SamplerType.None)
      {
          context.Config.GpuAccessor.Log("Invalid image store sampler type.");

          return;
      }

      int nextRa = imageOp.Ra.Index;
      int nextRb = imageOp.Rb.Index;

      // Both helpers hand out a copy of the next register of their sequence,
      // falling back to constant 0 once the sequence is past the zero register.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand NextRb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      bool bindless = imageOp.IsBindless;

      var operands = new List<Operand>();

      if (bindless)
      {
          operands.Add(context.Copy(Register(imageOp.Rc)));
      }

      for (int remaining = samplerType.GetDimensions(); remaining > 0; remaining--)
      {
          operands.Add(NextRa());
      }

      if (Sample1DAs2D && (samplerType & SamplerType.Mask) == SamplerType.Texture1D)
      {
          // 1D images are stored to as 2D with a zero second coordinate.
          operands.Add(Const(0));

          samplerType = (samplerType & ~SamplerType.Mask) | SamplerType.Texture2D;
      }

      if (samplerType.HasFlag(SamplerType.Array))
      {
          // Array flag is already present on the type at this point.
          operands.Add(NextRa());
      }

      TextureFormat storeFormat = TextureFormat.Unknown;

      if (!imageOp.UseComponents)
      {
          if (imageOp.ByteAddress)
          {
              // The X coordinate sits after the bindless handle source when there is one.
              int xSlot = bindless ? 1 : 0;

              Operand shiftAmount = Const(GetComponentSizeInBytesLog2(imageOp.Size));

              operands[xSlot] = context.ShiftRightS32(operands[xSlot], shiftAmount);
          }

          int valueCount = GetComponents(imageOp.Size);

          for (int value = 0; value < valueCount; value++)
          {
              operands.Add(NextRb());
          }

          storeFormat = GetTextureFormat(imageOp.Size);
      }
      else
      {
          // One Rb register is consumed for every bit set on the component mask.
          for (int pending = (int)imageOp.Components; pending != 0; pending >>= 1)
          {
              if ((pending & 1) != 0)
              {
                  operands.Add(NextRb());
              }
          }

          if (!bindless)
          {
              storeFormat = context.Config.GetTextureFormat(imageOp.Immediate);
          }
      }

      TextureOperation store = new TextureOperation(
          Instruction.ImageStore,
          samplerType,
          bindless ? TextureFlags.Bindless : TextureFlags.None,
          bindless ? 0 : imageOp.Immediate,
          0,
          null,
          operands.ToArray());

      store.Format = storeFormat;

      context.Add(store);
  }
  /// <summary>
  /// Emits a texture sample for the current opcode with no extra texture flags.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void Tex(EmitterContext context) => EmitTextureSample(context, TextureFlags.None);
  /// <summary>
  /// Emits a texture sample for the current opcode with the bindless flag set.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void TexB(EmitterContext context) => EmitTextureSample(context, TextureFlags.Bindless);
  /// <summary>
  /// Marks integer sampling as used on the shader config, then emits a texture
  /// sample with integer coordinates for the current opcode.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void Tld(EmitterContext context)
  {
      const TextureFlags FetchFlags = TextureFlags.IntCoords;

      context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

      EmitTextureSample(context, FetchFlags);
  }
  /// <summary>
  /// Marks integer sampling as used on the shader config, then emits a bindless
  /// texture sample with integer coordinates for the current opcode.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void TldB(EmitterContext context)
  {
      const TextureFlags FetchFlags = TextureFlags.IntCoords | TextureFlags.Bindless;

      context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

      EmitTextureSample(context, FetchFlags);
  }
  /// <summary>
  /// Emits the IR for the scalar texture opcodes. The current opcode must be an
  /// <see cref="OpCodeTextureScalar"/> of kind OpCodeTexs, OpCodeTlds or OpCodeTld4s;
  /// the source operand list is built according to the opcode kind and its target, and
  /// one <see cref="Instruction.TextureSample"/> operation is added per enabled component.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  /// <exception cref="InvalidOperationException">The current opcode is none of the supported scalar texture opcode types</exception>
  public static void Texs(EmitterContext context)
  {
      OpCodeTextureScalar op = (OpCodeTextureScalar)context.CurrOp;

      bool writesAnything = !op.Rd0.IsRZ || !op.Rd1.IsRZ;

      if (!writesAnything)
      {
          return;
      }

      var operands = new List<Operand>();

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Both helpers hand out a copy of the next register of their sequence,
      // falling back to constant 0 once the sequence is past the zero register.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand NextRb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      // Appends "count" consecutive registers of the Ra sequence to the sources.
      void PushRa(int count)
      {
          for (int pushed = 0; pushed < count; pushed++)
          {
              operands.Add(NextRa());
          }
      }

      // Appends "count" consecutive registers of the Rb sequence to the sources.
      void PushRb(int count)
      {
          for (int pushed = 0; pushed < count; pushed++)
          {
              operands.Add(NextRb());
          }
      }

      // Consumes one Rb register and appends one signed bitfield of "size" bits
      // per coordinate, the fields being "stride" bits apart.
      void PushPackedOffsets(int coordsCount, int stride, int size)
      {
          Operand packed = NextRb();

          for (int coord = 0, bit = 0; coord < coordsCount; coord++, bit += stride)
          {
              operands.Add(context.BitfieldExtractS32(packed, Const(bit), Const(size)));
          }
      }

      SamplerType type;
      TextureFlags flags;

      if (op is OpCodeTexs texs)
      {
          type = ConvertSamplerType(texs.Target);

          if (type == SamplerType.None)
          {
              context.Config.GpuAccessor.Log("Invalid texture sampler type.");

              return;
          }

          flags = ConvertTextureFlags(texs.Target);

          // We don't need to handle 1D -> Buffer conversions here as
          // only texture sample with integer coordinates can ever use buffer targets.
          if ((type & SamplerType.Array) == 0)
          {
              switch (texs.Target)
              {
                  case TextureTarget.Texture1DLodZero:
                      PushRa(1);

                      if (Sample1DAs2D)
                      {
                          operands.Add(ConstF(0));

                          type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                      }

                      operands.Add(ConstF(0));
                      break;

                  case TextureTarget.Texture2D:
                      PushRa(1);
                      PushRb(1);
                      break;

                  case TextureTarget.Texture2DLodZero:
                      PushRa(1);
                      PushRb(1);
                      operands.Add(ConstF(0));
                      break;

                  case TextureTarget.Texture2DLodLevel:
                  case TextureTarget.Texture2DDepthCompare:
                  case TextureTarget.Texture3D:
                  case TextureTarget.TextureCube:
                      PushRa(2);
                      PushRb(1);
                      break;

                  case TextureTarget.Texture2DLodZeroDepthCompare:
                  case TextureTarget.Texture3DLodZero:
                      PushRa(2);
                      PushRb(1);
                      operands.Add(ConstF(0));
                      break;

                  case TextureTarget.Texture2DLodLevelDepthCompare:
                  case TextureTarget.TextureCubeLodLevel:
                      PushRa(2);
                      PushRb(2);
                      break;
              }
          }
          else
          {
              // The first Ra register is read first but appended after the coordinates.
              Operand layer = NextRa();

              PushRa(1);
              PushRb(1);
              operands.Add(layer);

              if ((type & SamplerType.Shadow) != 0)
              {
                  PushRb(1);
              }

              if ((flags & TextureFlags.LodLevel) != 0)
              {
                  operands.Add(ConstF(0));
              }
          }
      }
      else if (op is OpCodeTlds tlds)
      {
          type = ConvertSamplerType(tlds.Target);

          if (type == SamplerType.None)
          {
              context.Config.GpuAccessor.Log("Invalid texel fetch sampler type.");

              return;
          }

          context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

          flags = ConvertTextureFlags(tlds.Target) | TextureFlags.IntCoords;

          // A 1D LOD zero fetch is treated as a buffer texture fetch when the
          // GPU accessor reports the handle as a texture buffer.
          if (tlds.Target == TexelLoadTarget.Texture1DLodZero &&
              context.Config.GpuAccessor.QueryIsTextureBuffer(tlds.Immediate))
          {
              type = SamplerType.TextureBuffer;
              flags &= ~TextureFlags.LodLevel;
          }

          switch (tlds.Target)
          {
              case TexelLoadTarget.Texture1DLodZero:
                  PushRa(1);

                  if (type != SamplerType.TextureBuffer)
                  {
                      if (Sample1DAs2D)
                      {
                          operands.Add(ConstF(0));

                          type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                      }

                      operands.Add(ConstF(0));
                  }
                  break;

              case TexelLoadTarget.Texture1DLodLevel:
                  PushRa(1);

                  if (Sample1DAs2D)
                  {
                      operands.Add(ConstF(0));

                      type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                  }

                  PushRb(1);
                  break;

              case TexelLoadTarget.Texture2DLodZero:
                  PushRa(1);
                  PushRb(1);
                  operands.Add(Const(0));
                  break;

              case TexelLoadTarget.Texture2DLodZeroOffset:
                  PushRa(2);
                  operands.Add(Const(0));
                  break;

              case TexelLoadTarget.Texture2DLodZeroMultisample:
              case TexelLoadTarget.Texture2DLodLevel:
              case TexelLoadTarget.Texture2DLodLevelOffset:
                  PushRa(2);
                  PushRb(1);
                  break;

              case TexelLoadTarget.Texture3DLodZero:
                  PushRa(2);
                  PushRb(1);
                  operands.Add(Const(0));
                  break;

              case TexelLoadTarget.Texture2DArrayLodZero:
                  PushRb(2);
                  PushRa(1);
                  operands.Add(Const(0));
                  break;
          }

          if ((flags & TextureFlags.Offset) != 0)
          {
              PushPackedOffsets(type.GetDimensions(), 4, 4);
          }
      }
      else if (op is OpCodeTld4s tld4s)
      {
          // The second coordinate comes from Ra when depth compare or offset
          // is present, and from Rb otherwise.
          bool secondCoordFromRa = tld4s.HasDepthCompare || tld4s.HasOffset;

          operands.Add(NextRa());
          operands.Add(secondCoordFromRa ? NextRa() : NextRb());

          type = SamplerType.Texture2D;
          flags = TextureFlags.Gather;

          if (tld4s.HasDepthCompare)
          {
              PushRb(1);

              type |= SamplerType.Shadow;
          }

          if (tld4s.HasOffset)
          {
              PushPackedOffsets(type.GetDimensions(), 8, 6);

              flags |= TextureFlags.Offset;
          }

          operands.Add(Const(tld4s.GatherCompIndex));
      }
      else
      {
          throw new InvalidOperationException($"Invalid opcode type \"{op.GetType().Name}\".");
      }

      Operand[] sources = operands.ToArray();

      // Half float results are gathered here (two per destination register)
      // and packed at the end; slots never written stay as constant zero.
      Operand[] lowerPair = { ConstF(0), ConstF(0) };
      Operand[] upperPair = { ConstF(0), ConstF(0) };

      int destCount = 0;

      Operand NextDest()
      {
          int slot = destCount++;

          bool useSecond = (slot >> 1) != 0;
          int lane = slot & 1;

          if (op.IsFp16)
          {
              Operand temp = Local();

              if (useSecond)
              {
                  upperPair[lane] = temp;
              }
              else
              {
                  lowerPair[lane] = temp;
              }

              return temp;
          }

          int registerIndex = useSecond ? op.Rd1.Index : op.Rd0.Index;

          // The zero register is never advanced to the next register.
          if (registerIndex < RegisterConsts.RegisterZeroIndex)
          {
              registerIndex += lane;
          }

          return Register(registerIndex, RegisterType.Gpr);
      }

      int handle = op.Immediate;

      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; component++, pending >>= 1)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(new TextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }

      if (op.IsFp16)
      {
          context.Copy(Register(op.Rd0), context.PackHalf2x16(lowerPair[0], lowerPair[1]));
          context.Copy(Register(op.Rd1), context.PackHalf2x16(upperPair[0], upperPair[1]));
      }
  }
  /// <summary>
  /// Emits the IR for the TLD4 (texture gather) instruction: one
  /// <see cref="Instruction.TextureSample"/> operation with the gather flag is added
  /// per enabled component. Nothing is emitted when the destination is the zero register.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  public static void Tld4(EmitterContext context)
  {
      IOpCodeTld4 op = (IOpCodeTld4)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;
      int nextRd = op.Rd.Index;

      // Source helpers hand out a copy of the next register of their sequence,
      // falling back to constant 0 once the sequence is past the zero register.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand NextRb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      Operand NextDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      bool isArray = op.IsArray;

      // The array index is read from Ra before anything else,
      // but is appended to the sources after the coordinates.
      Operand layer = isArray ? NextRa() : null;

      var operands = new List<Operand>();

      SamplerType type = ConvertSamplerType(op.Dimensions);

      TextureFlags flags = TextureFlags.Gather;

      if (op.Bindless)
      {
          operands.Add(NextRb());

          flags |= TextureFlags.Bindless;
      }

      int coordsCount = type.GetDimensions();

      for (int remaining = coordsCount; remaining > 0; remaining--)
      {
          operands.Add(NextRa());
      }

      bool promotedTo2D = Sample1DAs2D && type == SamplerType.Texture1D;

      if (promotedTo2D)
      {
          operands.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      if (isArray)
      {
          operands.Add(layer);

          type |= SamplerType.Array;
      }

      TextureGatherOffset offsetMode = op.Offset;

      bool hasOffset = offsetMode != TextureGatherOffset.None;
      bool hasTexelOffsets = offsetMode == TextureGatherOffset.Offsets;

      // The packed offset registers are read from Rb before the depth compare value.
      Operand packedFirst = hasOffset ? NextRb() : null;
      Operand packedSecond = hasTexelOffsets ? NextRb() : null;

      if (op.HasDepthCompare)
      {
          operands.Add(NextRb());

          type |= SamplerType.Shadow;
      }

      if (hasOffset)
      {
          int texelCount = hasTexelOffsets ? 4 : 1;
          int fieldCount = coordsCount * texelCount;

          // Each packed register holds 4 fields, 8 bits apart, of which 6 bits are extracted.
          for (int field = 0; field < fieldCount; field++)
          {
              Operand word = ((field >> 2) & 1) != 0 ? packedSecond : packedFirst;

              operands.Add(context.BitfieldExtractS32(word, Const((field & 3) * 8), Const(6)));
          }

          if (promotedTo2D)
          {
              for (int texel = 0; texel < texelCount; texel++)
              {
                  operands.Add(Const(0));
              }
          }

          flags |= hasTexelOffsets ? TextureFlags.Offsets : TextureFlags.Offset;
      }

      operands.Add(Const(op.GatherCompIndex));

      Operand[] sources = operands.ToArray();

      int handle = op.Immediate;

      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; component++, pending >>= 1)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(new TextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>
  /// Emits the texture mip map level query for the current opcode, bindless variant.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void TmmlB(EmitterContext context) => EmitTextureMipMapLevel(context, true);
  /// <summary>
  /// Emits the texture mip map level query for the current opcode, non-bindless variant.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void Tmml(EmitterContext context) => EmitTextureMipMapLevel(context, false);
  /// <summary>
  /// Emits <see cref="Instruction.Lod"/> operations for the current texture opcode.
  /// For the first two components, the result is multiplied by 256, converted to a
  /// signed integer and copied to the destination; other components are set to zero.
  /// Nothing is emitted when the destination is the zero register.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  /// <param name="isBindless">True if the first source is a handle read from Rb, false to use the opcode immediate as handle</param>
  private static void EmitTextureMipMapLevel(EmitterContext context, bool isBindless)
  {
      OpCodeTexture op = (OpCodeTexture)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;
      int nextRd = op.Rd.Index;

      // Source helpers hand out a copy of the next register of their sequence,
      // falling back to constant 0 once the sequence is past the zero register.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand NextRb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      Operand NextDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      var operands = new List<Operand>();

      TextureFlags flags = TextureFlags.None;

      if (isBindless)
      {
          operands.Add(NextRb());

          flags |= TextureFlags.Bindless;
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      int coordsCount = type.GetDimensions();

      bool isArray = op.IsArray;

      // The array index is read before the coordinates but appended after them.
      Operand layer = isArray ? NextRa() : null;

      for (int remaining = coordsCount; remaining > 0; remaining--)
      {
          operands.Add(NextRa());
      }

      if (Sample1DAs2D && type == SamplerType.Texture1D)
      {
          operands.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      if (isArray)
      {
          operands.Add(layer);

          type |= SamplerType.Array;
      }

      Operand[] sources = operands.ToArray();

      int handle = isBindless ? 0 : op.Immediate;

      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; component++, pending >>= 1)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          if (component < 2)
          {
              Operand lod = Local();

              context.Add(new TextureOperation(
                  Instruction.Lod,
                  type,
                  flags,
                  handle,
                  component,
                  lod,
                  sources));

              Operand scaled = context.FPMultiply(lod, ConstF(256.0f));

              context.Copy(dest, context.FPConvertToS32(scaled));
          }
          else
          {
              // Components z and w aren't standard, so the destination is
              // zeroed and a comment is left on the generated code.
              context.Add(new CommentNode("Unsupported component z or w found"));
              context.Copy(dest, Const(0));
          }
      }
  }
  /// <summary>
  /// Emits the IR for the TXD instruction (texture sample with explicit derivatives):
  /// one <see cref="Instruction.TextureSample"/> operation with the derivatives flag is
  /// added per enabled component. Nothing is emitted when the destination is the zero register.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  public static void Txd(EmitterContext context)
  {
      OpCodeTxd op = (OpCodeTxd)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;
      int nextRd = op.Rd.Index;

      // Source helpers hand out a copy of the next register of their sequence,
      // falling back to constant 0 once the sequence is past the zero register.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand NextRb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      Operand NextDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      bool bindless = op.IsBindless;

      var operands = new List<Operand>();

      TextureFlags flags = TextureFlags.Derivatives;

      if (bindless)
      {
          // Here the bindless handle is taken from the Ra sequence.
          operands.Add(NextRa());

          flags |= TextureFlags.Bindless;
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      int coordsCount = type.GetDimensions();

      for (int remaining = coordsCount; remaining > 0; remaining--)
      {
          operands.Add(NextRa());
      }

      bool promotedTo2D = Sample1DAs2D && type == SamplerType.Texture1D;

      if (promotedTo2D)
      {
          operands.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      // This register is always read; the code below takes the array index from
      // its low 16 bits and the offsets from 4-bit fields starting at bit 16.
      Operand packedParams = NextRa();

      if (op.IsArray)
      {
          operands.Add(context.BitwiseAnd(packedParams, Const(0xffff)));

          type |= SamplerType.Array;
      }

      // Derivatives (X and Y), read from the Rb sequence.
      int derivativeCount = coordsCount * 2;

      for (int derivative = 0; derivative < derivativeCount; derivative++)
      {
          operands.Add(NextRb());

          if (promotedTo2D)
          {
              operands.Add(ConstF(0));
          }
      }

      if (op.HasOffset)
      {
          for (int coord = 0, bit = 16; coord < coordsCount; coord++, bit += 4)
          {
              operands.Add(context.BitfieldExtractS32(packedParams, Const(bit), Const(4)));
          }

          if (promotedTo2D)
          {
              operands.Add(Const(0));
          }

          flags |= TextureFlags.Offset;
      }

      Operand[] sources = operands.ToArray();

      int handle = bindless ? 0 : op.Immediate;

      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; component++, pending >>= 1)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(new TextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>
  /// Emits the texture query for the current opcode, non-bindless variant.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void Txq(EmitterContext context) => EmitTextureQuery(context, bindless: false);
  /// <summary>
  /// Emits the texture query for the current opcode, bindless variant.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void TxqB(EmitterContext context) => EmitTextureQuery(context, bindless: true);
  /// <summary>
  /// Emits <see cref="Instruction.TextureSize"/> operations for the current opcode,
  /// one per enabled component, always using a 2D sampler type.
  /// Nothing is emitted when the destination is the zero register.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations</param>
  /// <param name="bindless">True if the first source is a handle read from Ra, false to use the opcode immediate as handle</param>
  private static void EmitTextureQuery(EmitterContext context, bool bindless)
  {
      OpCodeTex op = (OpCodeTex)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      // TODO: Validate and use property.
      TextureProperty queriedProperty = (TextureProperty)op.RawOpCode.Extract(22, 6);

      int nextRa = op.Ra.Index;
      int nextRd = op.Rd.Index;

      // Hands out a copy of the next Ra register, or constant 0 once past the zero register.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand NextDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      var operands = new List<Operand>();

      if (bindless)
      {
          operands.Add(NextRa());
      }

      operands.Add(NextRa());

      Operand[] sources = operands.ToArray();

      TextureFlags flags = TextureFlags.None;
      int handle = op.Immediate;

      if (bindless)
      {
          flags = TextureFlags.Bindless;
          handle = 0;
      }

      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; component++, pending >>= 1)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(new TextureOperation(
              Instruction.TextureSize,
              SamplerType.Texture2D,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>
  /// Emits the texture sample operations for the current texture instruction.
  /// One <see cref="TextureOperation"/> is added per component enabled on the
  /// instruction component mask, all of them sharing the same source list.
  /// Nothing is emitted when the destination register is RZ.
  /// </summary>
  /// <param name="context">Emitter context whose current op is an <see cref="OpCodeTexture"/></param>
  /// <param name="flags">Initial texture flags; when Bindless is set, the first Rb value is used as the first source</param>
  private static void EmitTextureSample(EmitterContext context, TextureFlags flags)
  {
      OpCodeTexture op = (OpCodeTexture)context.CurrOp;

      bool isBindless = (flags & TextureFlags.Bindless) != 0;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int raIndex = op.Ra.Index;
      int rbIndex = op.Rb.Index;

      // Ra() and Rb() hand out consecutive registers starting at the encoded
      // Ra/Rb index, so the ORDER of the calls below defines which register
      // feeds which source. Once the index goes past the zero register, a
      // constant zero is returned instead.
      Operand Ra()
      {
          if (raIndex > RegisterConsts.RegisterZeroIndex)
          {
              return Const(0);
          }

          return context.Copy(Register(raIndex++, RegisterType.Gpr));
      }

      Operand Rb()
      {
          if (rbIndex > RegisterConsts.RegisterZeroIndex)
          {
              return Const(0);
          }

          return context.Copy(Register(rbIndex++, RegisterType.Gpr));
      }

      // The array index is read from Ra before the coordinates, but it is
      // only appended to the source list after them.
      Operand arrayIndex = op.IsArray ? Ra() : null;

      List<Operand> sourcesList = new List<Operand>();

      if (isBindless)
      {
          sourcesList.Add(Rb());
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      bool hasLod = op.LodMode > TextureLodMode.LodZero;

      if (type == SamplerType.Texture1D && (flags & ~TextureFlags.Bindless) == TextureFlags.IntCoords && !(hasLod ||
          op.HasDepthCompare ||
          op.HasOffset ||
          op.IsArray ||
          op.IsMultisample))
      {
          // For bindless, we don't have any way to know the texture type,
          // so we assume it's texture buffer when the sampler type is 1D, since that's more common.
          bool isTypeBuffer = isBindless || context.Config.GpuAccessor.QueryIsTextureBuffer(op.Immediate);

          if (isTypeBuffer)
          {
              type = SamplerType.TextureBuffer;
          }
      }

      int coordsCount = type.GetDimensions();

      for (int index = 0; index < coordsCount; index++)
      {
          sourcesList.Add(Ra());
      }

      // Remember the 1D -> 2D promotion: the extra coordinate added here must
      // be mirrored by an extra offset component further below.
      bool is1DTo2D = Sample1DAs2D && type == SamplerType.Texture1D;

      if (is1DTo2D)
      {
          sourcesList.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      if (op.IsArray)
      {
          sourcesList.Add(arrayIndex);

          type |= SamplerType.Array;
      }

      // Both values are fetched from Rb up front (LOD first, then the packed
      // offsets) and appended to the source list later.
      Operand lodValue = hasLod ? Rb() : ConstF(0);

      Operand packedOffs = op.HasOffset ? Rb() : null;

      if (op.HasDepthCompare)
      {
          sourcesList.Add(Rb());

          type |= SamplerType.Shadow;
      }

      if ((op.LodMode == TextureLodMode.LodZero ||
           op.LodMode == TextureLodMode.LodLevel ||
           op.LodMode == TextureLodMode.LodLevelA) && !op.IsMultisample && type != SamplerType.TextureBuffer)
      {
          sourcesList.Add(lodValue);

          flags |= TextureFlags.LodLevel;
      }

      if (op.HasOffset)
      {
          // Each offset component is a signed 4-bit field of the packed value.
          for (int index = 0; index < coordsCount; index++)
          {
              sourcesList.Add(context.BitfieldExtractS32(packedOffs, Const(index * 4), Const(4)));
          }

          if (is1DTo2D)
          {
              // The operation is now typed as 2D, so give the offset a second
              // (zero) component to match the padded coordinate.
              // NOTE(review): assumes consumers size the offset vector from the
              // final sampler type - confirm against the code generator.
              sourcesList.Add(Const(0));
          }

          flags |= TextureFlags.Offset;
      }

      if (op.LodMode == TextureLodMode.LodBias ||
          op.LodMode == TextureLodMode.LodBiasA)
      {
          sourcesList.Add(lodValue);

          flags |= TextureFlags.LodBias;
      }

      if (op.IsMultisample)
      {
          sourcesList.Add(Rb());

          type |= SamplerType.Multisample;
      }

      Operand[] sources = sourcesList.ToArray();

      int rdIndex = op.Rd.Index;

      // Destinations are consecutive registers starting at Rd, one for each
      // enabled component.
      Operand GetDest()
      {
          if (rdIndex > RegisterConsts.RegisterZeroIndex)
          {
              return Const(0);
          }

          return Register(rdIndex++, RegisterType.Gpr);
      }

      // For bindless operations the handle field is left as zero.
      int handle = !isBindless ? op.Immediate : 0;

      for (int compMask = op.ComponentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
      {
          if ((compMask & 1) != 0)
          {
              Operand dest = GetDest();

              TextureOperation operation = new TextureOperation(
                  Instruction.TextureSample,
                  type,
                  flags,
                  handle,
                  compIndex,
                  dest,
                  sources);

              context.Add(operation);
          }
      }
  }
  /// <summary>
  /// Gets the component count associated with an integer size:
  /// 2 for B64, 4 for B128 and UB128, and 1 for every other size.
  /// </summary>
  /// <param name="size">Integer size to query</param>
  /// <returns>Number of components for the size</returns>
  private static int GetComponents(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.B64:
              return 2;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return 4;

          default:
              return 1;
      }
  }
  /// <summary>
  /// Maps an integer size to the value this method's name describes as the
  /// base-2 logarithm of the component size in bytes.
  /// Sizes that are not listed map to 2.
  /// </summary>
  /// <param name="size">Integer size to query</param>
  /// <returns>A value between 0 and 4, depending on the size</returns>
  private static int GetComponentSizeInBytesLog2(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.U8:
          case IntegerSize.S8:
              return 0;

          case IntegerSize.U16:
          case IntegerSize.S16:
              return 1;

          case IntegerSize.B64:
              return 3;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return 4;

          // B32 and anything not listed above.
          case IntegerSize.B32:
          default:
              return 2;
      }
  }
  /// <summary>
  /// Picks the integer texture format matching an integer size.
  /// Sizes that are not listed map to R32Uint.
  /// </summary>
  /// <param name="size">Integer size to convert</param>
  /// <returns>Texture format for the size</returns>
  private static TextureFormat GetTextureFormat(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.U8:
              return TextureFormat.R8Uint;

          case IntegerSize.S8:
              return TextureFormat.R8Sint;

          case IntegerSize.U16:
              return TextureFormat.R16Uint;

          case IntegerSize.S16:
              return TextureFormat.R16Sint;

          case IntegerSize.B64:
              return TextureFormat.R32G32Uint;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return TextureFormat.R32G32B32A32Uint;

          // B32 and anything not listed above.
          case IntegerSize.B32:
          default:
              return TextureFormat.R32Uint;
      }
  }
  /// <summary>
  /// Converts image dimensions into the equivalent sampler type.
  /// Array dimensions get the Array flag; unlisted values give None.
  /// </summary>
  /// <param name="target">Image dimensions to convert</param>
  /// <returns>Matching sampler type, or None when there is no match</returns>
  private static SamplerType ConvertSamplerType(ImageDimensions target)
  {
      switch (target)
      {
          case ImageDimensions.Image1D:
              return SamplerType.Texture1D;

          case ImageDimensions.ImageBuffer:
              return SamplerType.TextureBuffer;

          case ImageDimensions.Image1DArray:
              return SamplerType.Texture1D | SamplerType.Array;

          case ImageDimensions.Image2D:
              return SamplerType.Texture2D;

          case ImageDimensions.Image2DArray:
              return SamplerType.Texture2D | SamplerType.Array;

          case ImageDimensions.Image3D:
              return SamplerType.Texture3D;

          default:
              return SamplerType.None;
      }
  }
  /// <summary>
  /// Converts texture dimensions into the equivalent sampler type.
  /// </summary>
  /// <param name="dimensions">Texture dimensions to convert</param>
  /// <returns>Matching sampler type</returns>
  /// <exception cref="ArgumentException">Thrown when the dimensions value is not one of the handled values</exception>
  private static SamplerType ConvertSamplerType(TextureDimensions dimensions)
  {
      switch (dimensions)
      {
          case TextureDimensions.Texture1D:
              return SamplerType.Texture1D;

          case TextureDimensions.Texture2D:
              return SamplerType.Texture2D;

          case TextureDimensions.Texture3D:
              return SamplerType.Texture3D;

          case TextureDimensions.TextureCube:
              return SamplerType.TextureCube;

          default:
              throw new ArgumentException($"Invalid texture dimensions \"{dimensions}\".");
      }
  }
  /// <summary>
  /// Converts a texture target into the equivalent sampler type, including
  /// the Array and Shadow flags for array and depth compare targets.
  /// </summary>
  /// <param name="type">Texture target to convert</param>
  /// <returns>Matching sampler type, or None when the target is not handled</returns>
  private static SamplerType ConvertSamplerType(TextureTarget type)
  {
      return type switch
      {
          TextureTarget.Texture1DLodZero => SamplerType.Texture1D,

          TextureTarget.Texture2D => SamplerType.Texture2D,
          TextureTarget.Texture2DLodZero => SamplerType.Texture2D,
          TextureTarget.Texture2DLodLevel => SamplerType.Texture2D,

          TextureTarget.Texture2DDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,
          TextureTarget.Texture2DLodLevelDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,
          TextureTarget.Texture2DLodZeroDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,

          TextureTarget.Texture2DArray => SamplerType.Texture2D | SamplerType.Array,
          TextureTarget.Texture2DArrayLodZero => SamplerType.Texture2D | SamplerType.Array,

          TextureTarget.Texture2DArrayLodZeroDepthCompare => SamplerType.Texture2D | SamplerType.Array | SamplerType.Shadow,

          TextureTarget.Texture3D => SamplerType.Texture3D,
          TextureTarget.Texture3DLodZero => SamplerType.Texture3D,

          TextureTarget.TextureCube => SamplerType.TextureCube,
          TextureTarget.TextureCubeLodLevel => SamplerType.TextureCube,

          _ => SamplerType.None
      };
  }
  /// <summary>
  /// Converts a texel load target into the equivalent sampler type, including
  /// the Multisample and Array flags where the target calls for them.
  /// </summary>
  /// <param name="type">Texel load target to convert</param>
  /// <returns>Matching sampler type, or None when the target is not handled</returns>
  private static SamplerType ConvertSamplerType(TexelLoadTarget type)
  {
      return type switch
      {
          TexelLoadTarget.Texture1DLodZero => SamplerType.Texture1D,
          TexelLoadTarget.Texture1DLodLevel => SamplerType.Texture1D,

          TexelLoadTarget.Texture2DLodZero => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodZeroOffset => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodLevel => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodLevelOffset => SamplerType.Texture2D,

          TexelLoadTarget.Texture2DLodZeroMultisample => SamplerType.Texture2D | SamplerType.Multisample,

          TexelLoadTarget.Texture3DLodZero => SamplerType.Texture3D,

          TexelLoadTarget.Texture2DArrayLodZero => SamplerType.Texture2D | SamplerType.Array,

          _ => SamplerType.None
      };
  }
  /// <summary>
  /// Gets the texture flags implied by a texture target.
  /// The targets listed below give LodLevel; every other target gives None.
  /// </summary>
  /// <param name="type">Texture target to inspect</param>
  /// <returns>LodLevel or None</returns>
  private static TextureFlags ConvertTextureFlags(TextureTarget type)
  {
      return type switch
      {
          TextureTarget.Texture1DLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodLevel => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodLevelDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodZeroDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture2DArrayLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DArrayLodZeroDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture3DLodZero => TextureFlags.LodLevel,
          TextureTarget.TextureCubeLodLevel => TextureFlags.LodLevel,

          // Texture2D, Texture2DDepthCompare, Texture2DArray, Texture3D,
          // TextureCube and any other value carry no flags.
          _ => TextureFlags.None
      };
  }
  /// <summary>
  /// Gets the texture flags implied by a texel load target.
  /// Every handled target gives LodLevel, and the offset variants also give Offset.
  /// </summary>
  /// <param name="type">Texel load target to inspect</param>
  /// <returns>Flags for the target, or None when the target is not handled</returns>
  private static TextureFlags ConvertTextureFlags(TexelLoadTarget type)
  {
      return type switch
      {
          TexelLoadTarget.Texture1DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture1DLodLevel => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodLevel => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodZeroMultisample => TextureFlags.LodLevel,
          TexelLoadTarget.Texture3DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DArrayLodZero => TextureFlags.LodLevel,

          TexelLoadTarget.Texture2DLodZeroOffset => TextureFlags.LodLevel | TextureFlags.Offset,
          TexelLoadTarget.Texture2DLodLevelOffset => TextureFlags.LodLevel | TextureFlags.Offset,

          _ => TextureFlags.None
      };
  }
  1142. }
  1143. }