InstEmitTexture.cs 45 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469
  1. using Ryujinx.Graphics.Shader.Decoders;
  2. using Ryujinx.Graphics.Shader.IntermediateRepresentation;
  3. using Ryujinx.Graphics.Shader.Translation;
  4. using System;
  5. using System.Collections.Generic;
  6. using static Ryujinx.Graphics.Shader.Instructions.InstEmitHelper;
  7. using static Ryujinx.Graphics.Shader.IntermediateRepresentation.OperandHelper;
  8. namespace Ryujinx.Graphics.Shader.Instructions
  9. {
  10. static partial class InstEmit
  11. {
  12. private const bool Sample1DAs2D = true;
  /// <summary>
  /// Emits the intermediate representation for SULD, the surface (image) load instruction.
  /// One <see cref="Instruction.ImageLoad"/> operation is emitted per destination register.
  /// </summary>
  /// <param name="context">Emitter context whose current opcode is an <see cref="OpCodeImage"/></param>
  public static void Suld(EmitterContext context)
  {
      context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

      OpCodeImage op = (OpCodeImage)context.CurrOp;

      SamplerType type = ConvertSamplerType(op.Dimensions);

      if (type == SamplerType.None)
      {
          // SULD is a load, so the diagnostic must not talk about a store.
          context.Config.GpuAccessor.Log("Invalid image load sampler type.");

          return;
      }

      // Rb is Rd on the SULD instruction.
      int rdIndex = op.Rb.Index;
      int raIndex = op.Ra.Index;

      // Returns a copy of the next consecutive Ra register, or a constant 0
      // once the running index has moved past the zero register index.
      Operand Ra()
      {
          if (raIndex > RegisterConsts.RegisterZeroIndex)
          {
              return Const(0);
          }

          return context.Copy(Register(raIndex++, RegisterType.Gpr));
      }

      List<Operand> sourcesList = new List<Operand>();

      // For bindless access the first source is a copy of Rc.
      if (op.IsBindless)
      {
          sourcesList.Add(context.Copy(Register(op.Rc)));
      }

      int coordsCount = type.GetDimensions();

      for (int index = 0; index < coordsCount; index++)
      {
          sourcesList.Add(Ra());
      }

      // 1D images are accessed as 2D images with a constant 0 second coordinate.
      if (Sample1DAs2D && (type & SamplerType.Mask) == SamplerType.Texture1D)
      {
          sourcesList.Add(Const(0));

          type &= ~SamplerType.Mask;
          type |= SamplerType.Texture2D;
      }

      if (type.HasFlag(SamplerType.Array))
      {
          // The Array flag is already part of the type here, only the extra operand is needed.
          sourcesList.Add(Ra());
      }

      Operand[] sources = sourcesList.ToArray();

      int handle = !op.IsBindless ? op.HandleOffset : 0;

      TextureFlags flags = op.IsBindless ? TextureFlags.Bindless : TextureFlags.None;

      if (op.UseComponents)
      {
          int componentMask = (int)op.Components;

          for (int compMask = componentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
          {
              if ((compMask & 1) == 0)
              {
                  continue;
              }

              // Stop as soon as the destination reaches the zero register.
              if (rdIndex == RegisterConsts.RegisterZeroIndex)
              {
                  break;
              }

              Operand rd = Register(rdIndex++, RegisterType.Gpr);

              TextureOperation operation = context.CreateTextureOperation(
                  Instruction.ImageLoad,
                  type,
                  flags,
                  handle,
                  compIndex,
                  rd,
                  sources);

              // The format is only looked up from the handle for non-bindless access.
              if (!op.IsBindless)
              {
                  operation.Format = context.Config.GetTextureFormat(handle);
              }

              context.Add(operation);
          }
      }
      else
      {
          if (op.ByteAddress)
          {
              // The X coordinate follows the bindless handle operand when one is present.
              int xIndex = op.IsBindless ? 1 : 0;

              sources[xIndex] = context.ShiftRightS32(sources[xIndex], Const(GetComponentSizeInBytesLog2(op.Size)));
          }

          int components = GetComponents(op.Size);

          for (int compIndex = 0; compIndex < components; compIndex++)
          {
              if (rdIndex == RegisterConsts.RegisterZeroIndex)
              {
                  break;
              }

              Operand rd = Register(rdIndex++, RegisterType.Gpr);

              TextureOperation operation = context.CreateTextureOperation(
                  Instruction.ImageLoad,
                  type,
                  GetTextureFormat(op.Size),
                  flags,
                  handle,
                  compIndex,
                  rd,
                  sources);

              context.Add(operation);

              // Sub-word sizes are extended to 32 bits after the load.
              switch (op.Size)
              {
                  case IntegerSize.U8: context.Copy(rd, ZeroExtendTo32(context, rd, 8)); break;
                  case IntegerSize.U16: context.Copy(rd, ZeroExtendTo32(context, rd, 16)); break;
                  case IntegerSize.S8: context.Copy(rd, SignExtendTo32(context, rd, 8)); break;
                  case IntegerSize.S16: context.Copy(rd, SignExtendTo32(context, rd, 16)); break;
              }
          }
      }
  }
  /// <summary>
  /// Emits the intermediate representation for SUST, the surface (image) store instruction.
  /// A single <see cref="Instruction.ImageStore"/> operation is emitted.
  /// </summary>
  /// <param name="context">Emitter context whose current opcode is an <see cref="OpCodeImage"/></param>
  public static void Sust(EmitterContext context)
  {
      OpCodeImage op = (OpCodeImage)context.CurrOp;

      SamplerType type = ConvertSamplerType(op.Dimensions);

      if (type == SamplerType.None)
      {
          context.Config.GpuAccessor.Log("Invalid image store sampler type.");

          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Each call consumes the next consecutive register; once the running index
      // is past the zero register index a constant 0 is supplied instead.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand NextRb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      List<Operand> args = new List<Operand>();

      // Bindless access starts with a copy of Rc.
      if (op.IsBindless)
      {
          args.Add(context.Copy(Register(op.Rc)));
      }

      // Coordinates come from Ra.
      for (int remaining = type.GetDimensions(); remaining > 0; remaining--)
      {
          args.Add(NextRa());
      }

      // 1D images are accessed as 2D images with a constant 0 second coordinate.
      if (Sample1DAs2D && (type & SamplerType.Mask) == SamplerType.Texture1D)
      {
          args.Add(Const(0));

          type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
      }

      if (type.HasFlag(SamplerType.Array))
      {
          args.Add(NextRa());

          type |= SamplerType.Array;
      }

      TextureFormat format = TextureFormat.Unknown;

      if (!op.UseComponents)
      {
          if (op.ByteAddress)
          {
              // The X coordinate follows the bindless handle operand when one is present.
              int xIndex = op.IsBindless ? 1 : 0;

              args[xIndex] = context.ShiftRightS32(args[xIndex], Const(GetComponentSizeInBytesLog2(op.Size)));
          }

          int valueCount = GetComponents(op.Size);

          for (int i = 0; i < valueCount; i++)
          {
              args.Add(NextRb());
          }

          format = GetTextureFormat(op.Size);
      }
      else
      {
          // One value from Rb for every bit set in the component mask.
          for (int mask = (int)op.Components; mask != 0; mask >>= 1)
          {
              if ((mask & 1) != 0)
              {
                  args.Add(NextRb());
              }
          }

          if (!op.IsBindless)
          {
              format = context.Config.GetTextureFormat(op.HandleOffset);
          }
      }

      Operand[] sources = args.ToArray();

      int handle;
      TextureFlags flags;

      if (op.IsBindless)
      {
          handle = 0;
          flags = TextureFlags.Bindless;
      }
      else
      {
          handle = op.HandleOffset;
          flags = TextureFlags.None;
      }

      context.Add(context.CreateTextureOperation(
          Instruction.ImageStore,
          type,
          format,
          flags,
          handle,
          0,
          null,
          sources));
  }
  /// <summary>
  /// Emits a texture sample for the current opcode with no extra texture flags.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void Tex(EmitterContext context) => EmitTextureSample(context, TextureFlags.None);
  /// <summary>
  /// Emits a texture sample for the current opcode with the bindless flag set.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void TexB(EmitterContext context) => EmitTextureSample(context, TextureFlags.Bindless);
  /// <summary>
  /// Marks integer sampling as used and emits a texture sample with integer coordinates.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void Tld(EmitterContext context)
  {
      const TextureFlags SampleFlags = TextureFlags.IntCoords;

      context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

      EmitTextureSample(context, SampleFlags);
  }
  /// <summary>
  /// Marks integer sampling as used and emits a bindless texture sample with integer coordinates.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void TldB(EmitterContext context)
  {
      const TextureFlags SampleFlags = TextureFlags.IntCoords | TextureFlags.Bindless;

      context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

      EmitTextureSample(context, SampleFlags);
  }
  /// <summary>
  /// Emits texture sample operations for the scalar texture opcodes handled here
  /// (<see cref="OpCodeTexs"/>, <see cref="OpCodeTlds"/> and <see cref="OpCodeTld4s"/>).
  /// </summary>
  /// <param name="context">Emitter context whose current opcode is an <see cref="OpCodeTextureScalar"/></param>
  /// <exception cref="InvalidOperationException">The current opcode is none of the three supported opcode types</exception>
  public static void Texs(EmitterContext context)
  {
      OpCodeTextureScalar op = (OpCodeTextureScalar)context.CurrOp;

      // Nothing is emitted when both destinations report IsRZ.
      if (op.Rd0.IsRZ && op.Rd1.IsRZ)
      {
          return;
      }

      List<Operand> args = new List<Operand>();

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Each call consumes the next consecutive register; once the running index
      // is past the zero register index a constant 0 is supplied instead.
      // The order in which these are called below determines the register assignment.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand NextRb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      // Reads one packed value from Rb and appends one signed bit field per coordinate.
      void AppendPackedOffsets(int count, int stride, int size)
      {
          Operand packed = NextRb();

          for (int i = 0; i < count; i++)
          {
              args.Add(context.BitfieldExtractS32(packed, Const(i * stride), Const(size)));
          }
      }

      SamplerType type;
      TextureFlags flags;

      if (op is OpCodeTexs texsOp)
      {
          type = ConvertSamplerType(texsOp.Target);

          if (type == SamplerType.None)
          {
              context.Config.GpuAccessor.Log("Invalid texture sampler type.");

              return;
          }

          flags = ConvertTextureFlags(texsOp.Target);

          // We don't need to handle 1D -> Buffer conversions here as
          // only texture sample with integer coordinates can ever use buffer targets.

          if ((type & SamplerType.Array) == 0)
          {
              switch (texsOp.Target)
              {
                  case TextureTarget.Texture1DLodZero:
                      args.Add(NextRa());

                      if (Sample1DAs2D)
                      {
                          args.Add(ConstF(0));

                          type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                      }

                      args.Add(ConstF(0));
                      break;

                  case TextureTarget.Texture2D:
                      args.Add(NextRa());
                      args.Add(NextRb());
                      break;

                  case TextureTarget.Texture2DLodZero:
                      args.Add(NextRa());
                      args.Add(NextRb());
                      args.Add(ConstF(0));
                      break;

                  case TextureTarget.Texture2DLodLevel:
                  case TextureTarget.Texture2DDepthCompare:
                  case TextureTarget.Texture3D:
                  case TextureTarget.TextureCube:
                      args.Add(NextRa());
                      args.Add(NextRa());
                      args.Add(NextRb());
                      break;

                  case TextureTarget.Texture2DLodZeroDepthCompare:
                  case TextureTarget.Texture3DLodZero:
                      args.Add(NextRa());
                      args.Add(NextRa());
                      args.Add(NextRb());
                      args.Add(ConstF(0));
                      break;

                  case TextureTarget.Texture2DLodLevelDepthCompare:
                  case TextureTarget.TextureCubeLodLevel:
                      args.Add(NextRa());
                      args.Add(NextRa());
                      args.Add(NextRb());
                      args.Add(NextRb());
                      break;
              }
          }
          else
          {
              // The array index is read first but appended after the two coordinates.
              Operand layer = NextRa();

              args.Add(NextRa());
              args.Add(NextRb());
              args.Add(layer);

              if ((type & SamplerType.Shadow) != 0)
              {
                  args.Add(NextRb());
              }

              if ((flags & TextureFlags.LodLevel) != 0)
              {
                  args.Add(ConstF(0));
              }
          }
      }
      else if (op is OpCodeTlds tldsOp)
      {
          type = ConvertSamplerType(tldsOp.Target);

          if (type == SamplerType.None)
          {
              context.Config.GpuAccessor.Log("Invalid texel fetch sampler type.");

              return;
          }

          context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

          flags = ConvertTextureFlags(tldsOp.Target) | TextureFlags.IntCoords;

          // A 1D LOD-zero fetch whose handle is reported as a texture buffer is emitted
          // as a buffer access, without the LOD operand.
          if (tldsOp.Target == TexelLoadTarget.Texture1DLodZero && context.Config.GpuAccessor.QueryIsTextureBuffer(tldsOp.HandleOffset))
          {
              type = SamplerType.TextureBuffer;
              flags &= ~TextureFlags.LodLevel;
          }

          switch (tldsOp.Target)
          {
              case TexelLoadTarget.Texture1DLodZero:
                  args.Add(NextRa());

                  if (type != SamplerType.TextureBuffer)
                  {
                      if (Sample1DAs2D)
                      {
                          args.Add(ConstF(0));

                          type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                      }

                      args.Add(ConstF(0));
                  }
                  break;

              case TexelLoadTarget.Texture1DLodLevel:
                  args.Add(NextRa());

                  if (Sample1DAs2D)
                  {
                      args.Add(ConstF(0));

                      type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                  }

                  args.Add(NextRb());
                  break;

              case TexelLoadTarget.Texture2DLodZero:
                  args.Add(NextRa());
                  args.Add(NextRb());
                  args.Add(Const(0));
                  break;

              case TexelLoadTarget.Texture2DLodZeroOffset:
                  args.Add(NextRa());
                  args.Add(NextRa());
                  args.Add(Const(0));
                  break;

              case TexelLoadTarget.Texture2DLodZeroMultisample:
              case TexelLoadTarget.Texture2DLodLevel:
              case TexelLoadTarget.Texture2DLodLevelOffset:
                  args.Add(NextRa());
                  args.Add(NextRa());
                  args.Add(NextRb());
                  break;

              case TexelLoadTarget.Texture3DLodZero:
                  args.Add(NextRa());
                  args.Add(NextRa());
                  args.Add(NextRb());
                  args.Add(Const(0));
                  break;

              case TexelLoadTarget.Texture2DArrayLodZero:
                  args.Add(NextRb());
                  args.Add(NextRb());
                  args.Add(NextRa());
                  args.Add(Const(0));
                  break;
          }

          if ((flags & TextureFlags.Offset) != 0)
          {
              AppendPackedOffsets(type.GetDimensions(), 4, 4);
          }
      }
      else if (op is OpCodeTld4s tld4sOp)
      {
          // The first coordinate always comes from Ra; the second comes from Rb only
          // when neither depth compare nor offset is in use.
          args.Add(NextRa());

          if (tld4sOp.HasDepthCompare || tld4sOp.HasOffset)
          {
              args.Add(NextRa());
          }
          else
          {
              args.Add(NextRb());
          }

          type = SamplerType.Texture2D;
          flags = TextureFlags.Gather;

          if (tld4sOp.HasDepthCompare)
          {
              args.Add(NextRb());

              type |= SamplerType.Shadow;
          }

          if (tld4sOp.HasOffset)
          {
              AppendPackedOffsets(type.GetDimensions(), 8, 6);

              flags |= TextureFlags.Offset;
          }

          args.Add(Const(tld4sOp.GatherCompIndex));
      }
      else
      {
          throw new InvalidOperationException($"Invalid opcode type \"{op.GetType().Name}\".");
      }

      Operand[] sources = args.ToArray();

      // Halves to be packed into Rd0 and Rd1 when the result is FP16.
      Operand[] halvesRd0 = { ConstF(0), ConstF(0) };
      Operand[] halvesRd1 = { ConstF(0), ConstF(0) };

      int destCounter = 0;

      // Returns the destination for the next enabled component.
      Operand NextDest()
      {
          int slot = destCounter++;

          int high = slot >> 1;
          int low = slot & 1;

          if (op.IsFp16)
          {
              // FP16 results go to temporaries first and are packed at the end.
              Operand half = Local();

              if (high != 0)
              {
                  halvesRd1[low] = half;
              }
              else
              {
                  halvesRd0[low] = half;
              }

              return half;
          }

          int rdIndex = high != 0 ? op.Rd1.Index : op.Rd0.Index;

          if (rdIndex < RegisterConsts.RegisterZeroIndex)
          {
              rdIndex += low;
          }

          return Register(rdIndex, RegisterType.Gpr);
      }

      int handle = op.HandleOffset;

      int mask = op.ComponentMask;

      for (int component = 0; mask != 0; component++, mask >>= 1)
      {
          if ((mask & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(context.CreateTextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }

      if (op.IsFp16)
      {
          context.Copy(Register(op.Rd0), context.PackHalf2x16(halvesRd0[0], halvesRd0[1]));
          context.Copy(Register(op.Rd1), context.PackHalf2x16(halvesRd1[0], halvesRd1[1]));
      }
  }
  /// <summary>
  /// Emits texture gather operations for the current opcode, one per enabled component.
  /// </summary>
  /// <param name="context">Emitter context whose current opcode implements <see cref="IOpCodeTld4"/></param>
  public static void Tld4(EmitterContext context)
  {
      IOpCodeTld4 op = (IOpCodeTld4)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Each call consumes the next consecutive register; once the running index
      // is past the zero register index a constant 0 is supplied instead.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand NextRb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      // The array index is read from Ra before anything else, but appended after the coordinates.
      Operand layer = op.IsArray ? NextRa() : null;

      List<Operand> args = new List<Operand>();

      SamplerType type = ConvertSamplerType(op.Dimensions);

      TextureFlags flags = TextureFlags.Gather;

      if (op.Bindless)
      {
          args.Add(NextRb());

          flags |= TextureFlags.Bindless;
      }

      int coordsCount = type.GetDimensions();

      for (int i = 0; i < coordsCount; i++)
      {
          args.Add(NextRa());
      }

      bool promotedTo2D = Sample1DAs2D && type == SamplerType.Texture1D;

      if (promotedTo2D)
      {
          args.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      if (op.IsArray)
      {
          args.Add(layer);

          type |= SamplerType.Array;
      }

      bool hasAnyOffset = op.Offset != TextureGatherOffset.None;
      bool hasPerTexelOffsets = op.Offset == TextureGatherOffset.Offsets;

      // Packed offsets are read from Rb before the depth compare value.
      Operand packedFirst = hasAnyOffset ? NextRb() : null;
      Operand packedSecond = hasPerTexelOffsets ? NextRb() : null;

      if (op.HasDepthCompare)
      {
          args.Add(NextRb());

          type |= SamplerType.Shadow;
      }

      if (hasAnyOffset)
      {
          int texelCount = hasPerTexelOffsets ? 4 : 1;
          int fieldCount = coordsCount * texelCount;

          for (int i = 0; i < fieldCount; i++)
          {
              // Four 8-bit spaced fields per packed register, 6 bits each.
              Operand packed = ((i >> 2) & 1) == 0 ? packedFirst : packedSecond;

              args.Add(context.BitfieldExtractS32(packed, Const((i & 3) * 8), Const(6)));
          }

          if (promotedTo2D)
          {
              for (int i = 0; i < texelCount; i++)
              {
                  args.Add(Const(0));
              }
          }

          flags |= hasPerTexelOffsets ? TextureFlags.Offsets : TextureFlags.Offset;
      }

      args.Add(Const(op.GatherCompIndex));

      Operand[] sources = args.ToArray();

      int nextRd = op.Rd.Index;

      // Returns the next consecutive destination register, or a constant 0 operand
      // once the running index is past the zero register index.
      Operand NextDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      int handle = op.HandleOffset;

      int mask = op.ComponentMask;

      for (int component = 0; mask != 0; component++, mask >>= 1)
      {
          if ((mask & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(context.CreateTextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>
  /// Emits the texture mip map level query for the current opcode in bindless mode.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void TmmlB(EmitterContext context) => EmitTextureMipMapLevel(context, isBindless: true);
  /// <summary>
  /// Emits the texture mip map level query for the current opcode in non-bindless mode.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void Tmml(EmitterContext context) => EmitTextureMipMapLevel(context, isBindless: false);
  /// <summary>
  /// Emits <see cref="Instruction.Lod"/> operations for the current opcode and writes each
  /// result to the destination registers after multiplying by 256 and converting to a signed integer.
  /// </summary>
  /// <param name="context">Emitter context whose current opcode is an <see cref="OpCodeTexture"/></param>
  /// <param name="isBindless">True to read the first source from Rb and set the bindless flag</param>
  private static void EmitTextureMipMapLevel(EmitterContext context, bool isBindless)
  {
      OpCodeTexture op = (OpCodeTexture)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Each call consumes the next consecutive register; once the running index
      // is past the zero register index a constant 0 is supplied instead.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand NextRb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      TextureFlags flags = TextureFlags.None;

      List<Operand> args = new List<Operand>();

      if (isBindless)
      {
          args.Add(NextRb());

          flags |= TextureFlags.Bindless;
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      int coordsCount = type.GetDimensions();

      // The array index is read from Ra ahead of the coordinates, but appended after them.
      Operand layer = op.IsArray ? NextRa() : null;

      for (int i = 0; i < coordsCount; i++)
      {
          args.Add(NextRa());
      }

      if (Sample1DAs2D && type == SamplerType.Texture1D)
      {
          args.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      if (op.IsArray)
      {
          args.Add(layer);

          type |= SamplerType.Array;
      }

      Operand[] sources = args.ToArray();

      int nextRd = op.Rd.Index;

      // Returns the next consecutive destination register, or a constant 0 operand
      // once the running index is past the zero register index.
      Operand NextDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      int handle = !isBindless ? op.HandleOffset : 0;

      int mask = op.ComponentMask;

      for (int component = 0; mask != 0; component++, mask >>= 1)
      {
          if ((mask & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          if (component < 2)
          {
              Operand lod = Local();

              context.Add(context.CreateTextureOperation(
                  Instruction.Lod,
                  type,
                  flags,
                  handle,
                  component ^ 1, // The instruction component order is the inverse of GLSL's.
                  lod,
                  sources));

              // Scale by 256 and convert to a signed integer before writing the destination.
              Operand scaled = context.FPMultiply(lod, ConstF(256.0f));

              context.Copy(dest, context.FPConvertToS32(scaled));
          }
          else
          {
              // Components z and w aren't standard, we return 0 in this case and add a comment.
              context.Add(new CommentNode("Unsupported component z or w found"));

              context.Copy(dest, Const(0));
          }
      }
  }
  /// <summary>
  /// Emits texture sample operations with explicit derivatives for the current opcode,
  /// one per enabled component.
  /// </summary>
  /// <param name="context">Emitter context whose current opcode is an <see cref="OpCodeTxd"/></param>
  public static void Txd(EmitterContext context)
  {
      OpCodeTxd op = (OpCodeTxd)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Each call consumes the next consecutive register; once the running index
      // is past the zero register index a constant 0 is supplied instead.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      Operand NextRb() => nextRb > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRb++, RegisterType.Gpr));

      TextureFlags flags = TextureFlags.Derivatives;

      List<Operand> args = new List<Operand>();

      // For bindless access the first source is taken from Ra.
      if (op.IsBindless)
      {
          args.Add(NextRa());

          flags |= TextureFlags.Bindless;
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      int coordsCount = type.GetDimensions();

      for (int i = 0; i < coordsCount; i++)
      {
          args.Add(NextRa());
      }

      bool promotedTo2D = Sample1DAs2D && type == SamplerType.Texture1D;

      if (promotedTo2D)
      {
          args.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      // One more Ra register holds the array index (low 16 bits) and the offsets (from bit 16).
      Operand packedParams = NextRa();

      if (op.IsArray)
      {
          args.Add(context.BitwiseAnd(packedParams, Const(0xffff)));

          type |= SamplerType.Array;
      }

      // Derivatives (X and Y).
      int derivativeCount = 2 * coordsCount;

      for (int i = 0; i < derivativeCount; i++)
      {
          args.Add(NextRb());

          if (promotedTo2D)
          {
              args.Add(ConstF(0));
          }
      }

      if (op.HasOffset)
      {
          for (int i = 0; i < coordsCount; i++)
          {
              args.Add(context.BitfieldExtractS32(packedParams, Const(16 + i * 4), Const(4)));
          }

          if (promotedTo2D)
          {
              args.Add(Const(0));
          }

          flags |= TextureFlags.Offset;
      }

      Operand[] sources = args.ToArray();

      int nextRd = op.Rd.Index;

      // Returns the next consecutive destination register, or a constant 0 operand
      // once the running index is past the zero register index.
      Operand NextDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      int handle = !op.IsBindless ? op.HandleOffset : 0;

      int mask = op.ComponentMask;

      for (int component = 0; mask != 0; component++, mask >>= 1)
      {
          if ((mask & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(context.CreateTextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>
  /// Emits the texture query for the current opcode in non-bindless mode.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void Txq(EmitterContext context) => EmitTextureQuery(context, false);
  /// <summary>
  /// Emits the texture query for the current opcode in bindless mode.
  /// </summary>
  /// <param name="context">Emitter context</param>
  public static void TxqB(EmitterContext context) => EmitTextureQuery(context, true);
  /// <summary>
  /// Emits <see cref="Instruction.TextureSize"/> operations for the current opcode,
  /// one per enabled component. The sampler type is always <see cref="SamplerType.Texture2D"/>.
  /// </summary>
  /// <param name="context">Emitter context whose current opcode is an <see cref="OpCodeTex"/></param>
  /// <param name="bindless">True to read an extra leading source from Ra and set the bindless flag</param>
  private static void EmitTextureQuery(EmitterContext context, bool bindless)
  {
      OpCodeTex op = (OpCodeTex)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      // The queried property is decoded from bits 22..27 of the raw opcode but is not used yet.
      TextureProperty property = (TextureProperty)op.RawOpCode.Extract(22, 6);

      // TODO: Validate and use property.
      Instruction inst = Instruction.TextureSize;

      SamplerType type = SamplerType.Texture2D;

      TextureFlags flags = TextureFlags.None;

      if (bindless)
      {
          flags = TextureFlags.Bindless;
      }

      int nextRa = op.Ra.Index;

      // Each call consumes the next consecutive register; once the running index
      // is past the zero register index a constant 0 is supplied instead.
      Operand NextRa() => nextRa > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : context.Copy(Register(nextRa++, RegisterType.Gpr));

      List<Operand> args = new List<Operand>();

      if (bindless)
      {
          args.Add(NextRa());
      }

      args.Add(NextRa());

      Operand[] sources = args.ToArray();

      int nextRd = op.Rd.Index;

      // Returns the next consecutive destination register, or a constant 0 operand
      // once the running index is past the zero register index.
      Operand NextDest() => nextRd > RegisterConsts.RegisterZeroIndex
          ? Const(0)
          : Register(nextRd++, RegisterType.Gpr);

      int handle = !bindless ? op.HandleOffset : 0;

      int mask = op.ComponentMask;

      for (int component = 0; mask != 0; component++, mask >>= 1)
      {
          if ((mask & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(context.CreateTextureOperation(
              inst,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>
  /// Emits the texture sample operations for the texture opcode currently being translated.
  /// One <see cref="Instruction.TextureSample"/> operation is added for every bit set in the
  /// opcode component mask; all of them share the same source operand list.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the emitted operations</param>
  /// <param name="flags">Initial texture flags; LOD level, LOD bias and offset flags are added here when the opcode requires them</param>
  private static void EmitTextureSample(EmitterContext context, TextureFlags flags)
  {
      OpCodeTexture op = (OpCodeTexture)context.CurrOp;

      bool isBindless = (flags & TextureFlags.Bindless) != 0;

      // The destination is the zero register, so no operation is emitted.
      if (op.Rd.IsRZ)
      {
          return;
      }

      int raIndex = op.Ra.Index;
      int rbIndex = op.Rb.Index;

      // Returns a copy of the next register of the Ra sequence,
      // or constant zero once the index went past the zero register index.
      Operand Ra()
      {
          if (raIndex > RegisterConsts.RegisterZeroIndex)
          {
              return Const(0);
          }

          return context.Copy(Register(raIndex++, RegisterType.Gpr));
      }

      // Same as Ra(), but for the register sequence starting at Rb.
      Operand Rb()
      {
          if (rbIndex > RegisterConsts.RegisterZeroIndex)
          {
              return Const(0);
          }

          return context.Copy(Register(rbIndex++, RegisterType.Gpr));
      }

      // For array textures, the array index is read from Ra before the coordinates.
      Operand arrayIndex = op.IsArray ? Ra() : null;

      List<Operand> sourcesList = new List<Operand>();

      if (isBindless)
      {
          // The first Rb register is added as the very first source for bindless access.
          sourcesList.Add(Rb());
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      bool hasLod = op.LodMode > TextureLodMode.LodZero;

      if (type == SamplerType.Texture1D && (flags & ~TextureFlags.Bindless) == TextureFlags.IntCoords && !(hasLod ||
          op.HasDepthCompare ||
          op.HasOffset ||
          op.IsArray ||
          op.IsMultisample))
      {
          // For bindless, we don't have any way to know the texture type,
          // so we assume it's texture buffer when the sampler type is 1D, since that's more common.
          bool isTypeBuffer = isBindless || context.Config.GpuAccessor.QueryIsTextureBuffer(op.HandleOffset);

          if (isTypeBuffer)
          {
              type = SamplerType.TextureBuffer;
          }
      }

      int coordsCount = type.GetDimensions();

      for (int index = 0; index < coordsCount; index++)
      {
          sourcesList.Add(Ra());
      }

      bool is1DTo2D = false;

      if (Sample1DAs2D && type == SamplerType.Texture1D)
      {
          // The 1D texture is sampled as 2D, with the extra coordinate fixed at zero.
          sourcesList.Add(ConstF(0));

          type = SamplerType.Texture2D;
          is1DTo2D = true;
      }

      if (op.IsArray)
      {
          sourcesList.Add(arrayIndex);

          type |= SamplerType.Array;
      }

      // Rb is consumed in this fixed order: LOD value, packed offsets, depth compare value
      // and (further below) the multisample index.
      Operand lodValue = hasLod ? Rb() : ConstF(0);

      Operand packedOffs = op.HasOffset ? Rb() : null;

      if (op.HasDepthCompare)
      {
          sourcesList.Add(Rb());

          type |= SamplerType.Shadow;
      }

      if ((op.LodMode == TextureLodMode.LodZero ||
           op.LodMode == TextureLodMode.LodLevel ||
           op.LodMode == TextureLodMode.LodLevelA) && !op.IsMultisample && type != SamplerType.TextureBuffer)
      {
          sourcesList.Add(lodValue);

          flags |= TextureFlags.LodLevel;
      }

      if (op.HasOffset)
      {
          // Each offset component is extracted as a signed 4-bit field of the packed value.
          for (int index = 0; index < coordsCount; index++)
          {
              sourcesList.Add(context.BitfieldExtractS32(packedOffs, Const(index * 4), Const(4)));
          }

          if (is1DTo2D)
          {
              // The sampler type was promoted to 2D above, so the offset vector needs
              // a second component to match the number of coordinates of the new type.
              sourcesList.Add(Const(0));
          }

          flags |= TextureFlags.Offset;
      }

      if (op.LodMode == TextureLodMode.LodBias ||
          op.LodMode == TextureLodMode.LodBiasA)
      {
          sourcesList.Add(lodValue);

          flags |= TextureFlags.LodBias;
      }

      if (op.IsMultisample)
      {
          sourcesList.Add(Rb());

          type |= SamplerType.Multisample;
      }

      Operand[] sources = sourcesList.ToArray();

      int rdIndex = op.Rd.Index;

      // Returns the next destination register of the Rd sequence,
      // or constant zero once the index went past the zero register index.
      Operand GetDest()
      {
          if (rdIndex > RegisterConsts.RegisterZeroIndex)
          {
              return Const(0);
          }

          return Register(rdIndex++, RegisterType.Gpr);
      }

      // Bindless operations use handle 0 here, the handle register was added to the sources instead.
      int handle = !isBindless ? op.HandleOffset : 0;

      for (int compMask = op.ComponentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
      {
          if ((compMask & 1) != 0)
          {
              Operand dest = GetDest();

              TextureOperation operation = context.CreateTextureOperation(
                  Instruction.TextureSample,
                  type,
                  flags,
                  handle,
                  compIndex,
                  dest,
                  sources);

              context.Add(operation);
          }
      }
  }
  /// <summary>
  /// Gets the component count associated with an integer size.
  /// </summary>
  /// <param name="size">Integer size to query</param>
  /// <returns>2 for B64, 4 for B128 and UB128, 1 for every other size</returns>
  private static int GetComponents(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.B64:
              return 2;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return 4;

          default:
              return 1;
      }
  }
  /// <summary>
  /// Gets the base 2 logarithm value associated with an integer size.
  /// </summary>
  /// <param name="size">Integer size to query</param>
  /// <returns>
  /// 0 for the 8-bit sizes, 1 for the 16-bit sizes, 2 for B32, 3 for B64,
  /// 4 for B128 and UB128, and 2 for any other size
  /// </returns>
  private static int GetComponentSizeInBytesLog2(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.U8:
          case IntegerSize.S8:
              return 0;

          case IntegerSize.U16:
          case IntegerSize.S16:
              return 1;

          case IntegerSize.B64:
              return 3;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return 4;

          // B32 and everything not listed above.
          default:
              return 2;
      }
  }
  /// <summary>
  /// Gets the texture format associated with an integer size.
  /// </summary>
  /// <param name="size">Integer size to convert</param>
  /// <returns>The matching integer texture format, or R32Uint for sizes without an explicit mapping</returns>
  private static TextureFormat GetTextureFormat(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.U8:
              return TextureFormat.R8Uint;

          case IntegerSize.S8:
              return TextureFormat.R8Sint;

          case IntegerSize.U16:
              return TextureFormat.R16Uint;

          case IntegerSize.S16:
              return TextureFormat.R16Sint;

          case IntegerSize.B64:
              return TextureFormat.R32G32Uint;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return TextureFormat.R32G32B32A32Uint;

          // B32 and everything not listed above.
          default:
              return TextureFormat.R32Uint;
      }
  }
  /// <summary>
  /// Converts image dimensions into the equivalent sampler type.
  /// </summary>
  /// <param name="target">Image dimensions to convert</param>
  /// <returns>The equivalent sampler type, or <see cref="SamplerType.None"/> when there is no mapping</returns>
  private static SamplerType ConvertSamplerType(ImageDimensions target)
  {
      switch (target)
      {
          case ImageDimensions.Image1D:
              return SamplerType.Texture1D;

          case ImageDimensions.ImageBuffer:
              return SamplerType.TextureBuffer;

          case ImageDimensions.Image1DArray:
              return SamplerType.Texture1D | SamplerType.Array;

          case ImageDimensions.Image2D:
              return SamplerType.Texture2D;

          case ImageDimensions.Image2DArray:
              return SamplerType.Texture2D | SamplerType.Array;

          case ImageDimensions.Image3D:
              return SamplerType.Texture3D;

          default:
              return SamplerType.None;
      }
  }
  /// <summary>
  /// Converts texture dimensions into the equivalent sampler type.
  /// </summary>
  /// <param name="dimensions">Texture dimensions to convert</param>
  /// <returns>The equivalent sampler type</returns>
  /// <exception cref="ArgumentException">Thrown when <paramref name="dimensions"/> has no known mapping</exception>
  private static SamplerType ConvertSamplerType(TextureDimensions dimensions)
  {
      switch (dimensions)
      {
          case TextureDimensions.Texture1D:
              return SamplerType.Texture1D;

          case TextureDimensions.Texture2D:
              return SamplerType.Texture2D;

          case TextureDimensions.Texture3D:
              return SamplerType.Texture3D;

          case TextureDimensions.TextureCube:
              return SamplerType.TextureCube;

          default:
              throw new ArgumentException($"Invalid texture dimensions \"{dimensions}\".");
      }
  }
  /// <summary>
  /// Converts a texture target into the equivalent sampler type.
  /// </summary>
  /// <param name="type">Texture target to convert</param>
  /// <returns>The equivalent sampler type, or <see cref="SamplerType.None"/> when there is no mapping</returns>
  private static SamplerType ConvertSamplerType(TextureTarget type)
  {
      return type switch
      {
          TextureTarget.Texture1DLodZero => SamplerType.Texture1D,

          TextureTarget.Texture2D => SamplerType.Texture2D,
          TextureTarget.Texture2DLodZero => SamplerType.Texture2D,
          TextureTarget.Texture2DLodLevel => SamplerType.Texture2D,

          TextureTarget.Texture2DDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,
          TextureTarget.Texture2DLodLevelDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,
          TextureTarget.Texture2DLodZeroDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,

          TextureTarget.Texture2DArray => SamplerType.Texture2D | SamplerType.Array,
          TextureTarget.Texture2DArrayLodZero => SamplerType.Texture2D | SamplerType.Array,

          TextureTarget.Texture2DArrayLodZeroDepthCompare => SamplerType.Texture2D | SamplerType.Array | SamplerType.Shadow,

          TextureTarget.Texture3D => SamplerType.Texture3D,
          TextureTarget.Texture3DLodZero => SamplerType.Texture3D,

          TextureTarget.TextureCube => SamplerType.TextureCube,
          TextureTarget.TextureCubeLodLevel => SamplerType.TextureCube,

          _ => SamplerType.None
      };
  }
  /// <summary>
  /// Converts a texel load target into the equivalent sampler type.
  /// </summary>
  /// <param name="type">Texel load target to convert</param>
  /// <returns>The equivalent sampler type, or <see cref="SamplerType.None"/> when there is no mapping</returns>
  private static SamplerType ConvertSamplerType(TexelLoadTarget type)
  {
      return type switch
      {
          TexelLoadTarget.Texture1DLodZero => SamplerType.Texture1D,
          TexelLoadTarget.Texture1DLodLevel => SamplerType.Texture1D,

          TexelLoadTarget.Texture2DLodZero => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodZeroOffset => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodLevel => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodLevelOffset => SamplerType.Texture2D,

          TexelLoadTarget.Texture2DLodZeroMultisample => SamplerType.Texture2D | SamplerType.Multisample,

          TexelLoadTarget.Texture3DLodZero => SamplerType.Texture3D,

          TexelLoadTarget.Texture2DArrayLodZero => SamplerType.Texture2D | SamplerType.Array,

          _ => SamplerType.None
      };
  }
  /// <summary>
  /// Gets the texture flags implied by a texture target.
  /// </summary>
  /// <param name="type">Texture target to query</param>
  /// <returns>
  /// <see cref="TextureFlags.LodLevel"/> for the targets listed below,
  /// <see cref="TextureFlags.None"/> for all other targets
  /// </returns>
  private static TextureFlags ConvertTextureFlags(TextureTarget type)
  {
      return type switch
      {
          TextureTarget.Texture1DLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodLevel => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodLevelDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodZeroDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture2DArrayLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DArrayLodZeroDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture3DLodZero => TextureFlags.LodLevel,
          TextureTarget.TextureCubeLodLevel => TextureFlags.LodLevel,

          // Texture2D, Texture2DDepthCompare, Texture2DArray, Texture3D, TextureCube
          // and any other value carry no extra flags.
          _ => TextureFlags.None
      };
  }
  /// <summary>
  /// Gets the texture flags implied by a texel load target.
  /// </summary>
  /// <param name="type">Texel load target to query</param>
  /// <returns>
  /// <see cref="TextureFlags.LodLevel"/> for the listed targets, combined with
  /// <see cref="TextureFlags.Offset"/> for the offset variants,
  /// or <see cref="TextureFlags.None"/> when there is no mapping
  /// </returns>
  private static TextureFlags ConvertTextureFlags(TexelLoadTarget type)
  {
      return type switch
      {
          TexelLoadTarget.Texture1DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture1DLodLevel => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodLevel => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodZeroMultisample => TextureFlags.LodLevel,
          TexelLoadTarget.Texture3DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DArrayLodZero => TextureFlags.LodLevel,

          TexelLoadTarget.Texture2DLodZeroOffset => TextureFlags.LodLevel | TextureFlags.Offset,
          TexelLoadTarget.Texture2DLodLevelOffset => TextureFlags.LodLevel | TextureFlags.Offset,

          _ => TextureFlags.None
      };
  }
  1139. }
  1140. }