InstEmitTexture.cs 45 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475
  1. using Ryujinx.Graphics.Shader.Decoders;
  2. using Ryujinx.Graphics.Shader.IntermediateRepresentation;
  3. using Ryujinx.Graphics.Shader.Translation;
  4. using System;
  5. using System.Collections.Generic;
  6. using static Ryujinx.Graphics.Shader.Instructions.InstEmitHelper;
  7. using static Ryujinx.Graphics.Shader.IntermediateRepresentation.OperandHelper;
  8. namespace Ryujinx.Graphics.Shader.Instructions
  9. {
  10. static partial class InstEmit
  11. {
  // When true, the emitters in this class turn 1D sampler types into 2D ones:
  // they append an extra zero coordinate and replace the type with Texture2D.
  12. private const bool Sample1DAs2D = true;
  /// <summary>
  /// Emits the IR for an image load. The current opcode is read as an
  /// <see cref="OpCodeImage"/> and one <see cref="Instruction.ImageLoad"/> operation is
  /// added per destination register that gets written.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations.</param>
  public static void Suld(EmitterContext context)
  {
      OpCodeImage op = (OpCodeImage)context.CurrOp;

      SamplerType type = ConvertSamplerType(op.Dimensions);

      if (type == SamplerType.None)
      {
          // This is the load path, so the diagnostic must not talk about a store.
          context.Config.GpuAccessor.Log("Invalid image load sampler type.");

          return;
      }

      // Rb is Rd on the SULD instruction.
      int rdIndex = op.Rb.Index;
      int raIndex = op.Ra.Index;

      // Reads the next Ra register in sequence; once the index has moved past
      // RegisterZeroIndex a constant zero is returned instead.
      Operand Ra()
      {
          if (raIndex > RegisterConsts.RegisterZeroIndex)
          {
              return Const(0);
          }

          return context.Copy(Register(raIndex++, RegisterType.Gpr));
      }

      // For array types the array index is read from Ra before the coordinates.
      Operand arrayIndex = type.HasFlag(SamplerType.Array) ? Ra() : null;

      List<Operand> sourcesList = new List<Operand>();

      if (op.IsBindless)
      {
          // Bindless: the first source is the copied Rc register.
          sourcesList.Add(context.Copy(Register(op.Rc)));
      }

      int coordsCount = type.GetDimensions();

      for (int index = 0; index < coordsCount; index++)
      {
          sourcesList.Add(Ra());
      }

      if (Sample1DAs2D && (type & SamplerType.Mask) == SamplerType.Texture1D)
      {
          // Pad the missing second coordinate and switch the base type to 2D.
          sourcesList.Add(Const(0));

          type &= ~SamplerType.Mask;
          type |= SamplerType.Texture2D;
      }

      if (type.HasFlag(SamplerType.Array))
      {
          // The array index goes after the coordinates. The flag is already set
          // on the type here, so there is nothing to OR in.
          sourcesList.Add(arrayIndex);
      }

      Operand[] sources = sourcesList.ToArray();

      int handle = !op.IsBindless ? op.Immediate : 0;

      TextureFlags flags = op.IsBindless ? TextureFlags.Bindless : TextureFlags.None;

      if (op.UseComponents)
      {
          int componentMask = (int)op.Components;

          for (int compMask = componentMask, compIndex = 0; compMask != 0; compMask >>= 1, compIndex++)
          {
              if ((compMask & 1) == 0)
              {
                  continue;
              }

              // Stop as soon as the destination sequence reaches the zero register.
              if (rdIndex == RegisterConsts.RegisterZeroIndex)
              {
                  break;
              }

              Operand rd = Register(rdIndex++, RegisterType.Gpr);

              TextureOperation operation = new TextureOperation(
                  Instruction.ImageLoad,
                  type,
                  flags,
                  handle,
                  compIndex,
                  rd,
                  sources);

              if (!op.IsBindless)
              {
                  operation.Format = context.Config.GetTextureFormat(handle);
              }

              context.Add(operation);
          }
      }
      else
      {
          if (op.ByteAddress)
          {
              // The X coordinate is a byte address: shift it right by log2 of the
              // component size. With bindless the X coordinate sits after the handle.
              int xIndex = op.IsBindless ? 1 : 0;

              sources[xIndex] = context.ShiftRightS32(sources[xIndex], Const(GetComponentSizeInBytesLog2(op.Size)));
          }

          int components = GetComponents(op.Size);

          for (int compIndex = 0; compIndex < components; compIndex++)
          {
              if (rdIndex == RegisterConsts.RegisterZeroIndex)
              {
                  break;
              }

              Operand rd = Register(rdIndex++, RegisterType.Gpr);

              TextureOperation operation = new TextureOperation(
                  Instruction.ImageLoad,
                  type,
                  flags,
                  handle,
                  compIndex,
                  rd,
                  sources)
              {
                  Format = GetTextureFormat(op.Size)
              };

              context.Add(operation);

              // Sizes narrower than 32 bits are extended in place after the load.
              switch (op.Size)
              {
                  case IntegerSize.U8: context.Copy(rd, ZeroExtendTo32(context, rd, 8)); break;
                  case IntegerSize.U16: context.Copy(rd, ZeroExtendTo32(context, rd, 16)); break;
                  case IntegerSize.S8: context.Copy(rd, SignExtendTo32(context, rd, 8)); break;
                  case IntegerSize.S16: context.Copy(rd, SignExtendTo32(context, rd, 16)); break;
              }
          }
      }
  }
  /// <summary>
  /// Emits the IR for an image store. All sources (optional bindless handle, coordinates,
  /// optional array index and the values to store) are gathered into a single
  /// <see cref="Instruction.ImageStore"/> operation with no destination.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operation.</param>
  public static void Sust(EmitterContext context)
  {
      OpCodeImage op = (OpCodeImage)context.CurrOp;

      SamplerType type = ConvertSamplerType(op.Dimensions);

      if (type == SamplerType.None)
      {
          context.Config.GpuAccessor.Log("Invalid image store sampler type.");

          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Sequential reader over the Ra registers; yields constant zero once the
      // index has moved past RegisterZeroIndex.
      Operand ReadRa()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      // Same as ReadRa, but over the Rb registers (the values being stored).
      Operand ReadRb()
      {
          return nextRb > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRb++, RegisterType.Gpr));
      }

      // For array types the array index is read before the coordinates.
      Operand layer = null;

      if (type.HasFlag(SamplerType.Array))
      {
          layer = ReadRa();
      }

      List<Operand> operands = new List<Operand>();

      if (op.IsBindless)
      {
          operands.Add(context.Copy(Register(op.Rc)));
      }

      for (int remaining = type.GetDimensions(); remaining > 0; remaining--)
      {
          operands.Add(ReadRa());
      }

      if (Sample1DAs2D && (type & SamplerType.Mask) == SamplerType.Texture1D)
      {
          // Pad the second coordinate and replace the base type with 2D.
          operands.Add(Const(0));

          type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
      }

      if (type.HasFlag(SamplerType.Array))
      {
          operands.Add(layer);

          type |= SamplerType.Array;
      }

      TextureFormat format = TextureFormat.Unknown;

      if (!op.UseComponents)
      {
          if (op.ByteAddress)
          {
              // X is a byte address; with bindless it sits right after the handle.
              int xSlot = op.IsBindless ? 1 : 0;

              operands[xSlot] = context.ShiftRightS32(operands[xSlot], Const(GetComponentSizeInBytesLog2(op.Size)));
          }

          for (int remaining = GetComponents(op.Size); remaining > 0; remaining--)
          {
              operands.Add(ReadRb());
          }

          format = GetTextureFormat(op.Size);
      }
      else
      {
          // One value register per bit set in the component mask.
          for (int pending = (int)op.Components; pending != 0; pending >>= 1)
          {
              if ((pending & 1) != 0)
              {
                  operands.Add(ReadRb());
              }
          }

          if (!op.IsBindless)
          {
              format = context.Config.GetTextureFormat(op.Immediate);
          }
      }

      Operand[] sources = operands.ToArray();

      int handle;
      TextureFlags flags;

      if (op.IsBindless)
      {
          handle = 0;
          flags = TextureFlags.Bindless;
      }
      else
      {
          handle = op.Immediate;
          flags = TextureFlags.None;
      }

      TextureOperation store = new TextureOperation(
          Instruction.ImageStore,
          type,
          flags,
          handle,
          0,
          null,
          sources);

      store.Format = format;

      context.Add(store);
  }
  /// <summary>Emits a texture sample with no extra flags.</summary>
  /// <param name="context">Emitter context for the current opcode.</param>
  public static void Tex(EmitterContext context) => EmitTextureSample(context, TextureFlags.None);
  /// <summary>Emits a texture sample with the bindless flag set.</summary>
  /// <param name="context">Emitter context for the current opcode.</param>
  public static void TexB(EmitterContext context) => EmitTextureSample(context, TextureFlags.Bindless);
  /// <summary>
  /// Marks integer sampling as a used feature, then emits a texture sample
  /// with integer coordinates.
  /// </summary>
  /// <param name="context">Emitter context for the current opcode.</param>
  public static void Tld(EmitterContext context)
  {
      const TextureFlags sampleFlags = TextureFlags.IntCoords;

      context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

      EmitTextureSample(context, sampleFlags);
  }
  /// <summary>
  /// Marks integer sampling as a used feature, then emits a bindless texture
  /// sample with integer coordinates.
  /// </summary>
  /// <param name="context">Emitter context for the current opcode.</param>
  public static void TldB(EmitterContext context)
  {
      const TextureFlags sampleFlags = TextureFlags.IntCoords | TextureFlags.Bindless;

      context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

      EmitTextureSample(context, sampleFlags);
  }
  /// <summary>
  /// Emits the IR for the scalar texture opcodes. The current opcode is read as an
  /// <see cref="OpCodeTextureScalar"/> and handled according to its concrete type
  /// (<c>OpCodeTexs</c>, <c>OpCodeTlds</c> or <c>OpCodeTld4s</c>); one
  /// <see cref="Instruction.TextureSample"/> operation is added per bit set in the component mask.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations.</param>
  /// <exception cref="InvalidOperationException">The opcode is none of the three supported types.</exception>
  public static void Texs(EmitterContext context)
  {
      OpCodeTextureScalar op = (OpCodeTextureScalar)context.CurrOp;

      // Nothing is emitted when neither destination register is written.
      if (op.Rd0.IsRZ && op.Rd1.IsRZ)
      {
          return;
      }

      List<Operand> operands = new List<Operand>();

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Sequential readers over the Ra / Rb registers. Each call copies the next
      // register; past RegisterZeroIndex a constant zero is returned instead.
      // The order of these calls below is significant.
      Operand ReadRa()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      Operand ReadRb()
      {
          return nextRb > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRb++, RegisterType.Gpr));
      }

      // Reads one packed register from Rb and appends `count` signed bitfields of
      // `width` bits taken at multiples of `stride` bits.
      void AppendPackedOffsets(int count, int stride, int width)
      {
          Operand packed = ReadRb();

          for (int i = 0; i < count; i++)
          {
              operands.Add(context.BitfieldExtractS32(packed, Const(i * stride), Const(width)));
          }
      }

      SamplerType type;
      TextureFlags flags;

      if (op is OpCodeTexs texsOp)
      {
          type = ConvertSamplerType(texsOp.Target);

          if (type == SamplerType.None)
          {
              context.Config.GpuAccessor.Log("Invalid texture sampler type.");

              return;
          }

          flags = ConvertTextureFlags(texsOp.Target);

          // We don't need to handle 1D -> Buffer conversions here as
          // only texture sample with integer coordinates can ever use buffer targets.
          if ((type & SamplerType.Array) == 0)
          {
              switch (texsOp.Target)
              {
                  case TextureTarget.Texture1DLodZero:
                      operands.Add(ReadRa());

                      if (Sample1DAs2D)
                      {
                          operands.Add(ConstF(0));

                          type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                      }

                      operands.Add(ConstF(0));
                      break;

                  case TextureTarget.Texture2D:
                      operands.Add(ReadRa());
                      operands.Add(ReadRb());
                      break;

                  case TextureTarget.Texture2DLodZero:
                      operands.Add(ReadRa());
                      operands.Add(ReadRb());
                      operands.Add(ConstF(0));
                      break;

                  case TextureTarget.Texture2DLodLevel:
                  case TextureTarget.Texture2DDepthCompare:
                  case TextureTarget.Texture3D:
                  case TextureTarget.TextureCube:
                      operands.Add(ReadRa());
                      operands.Add(ReadRa());
                      operands.Add(ReadRb());
                      break;

                  case TextureTarget.Texture2DLodZeroDepthCompare:
                  case TextureTarget.Texture3DLodZero:
                      operands.Add(ReadRa());
                      operands.Add(ReadRa());
                      operands.Add(ReadRb());
                      operands.Add(ConstF(0));
                      break;

                  case TextureTarget.Texture2DLodLevelDepthCompare:
                  case TextureTarget.TextureCubeLodLevel:
                      operands.Add(ReadRa());
                      operands.Add(ReadRa());
                      operands.Add(ReadRb());
                      operands.Add(ReadRb());
                      break;
              }
          }
          else
          {
              // The array index is read first but appended after the coordinates.
              Operand layer = ReadRa();

              operands.Add(ReadRa());
              operands.Add(ReadRb());
              operands.Add(layer);

              if ((type & SamplerType.Shadow) != 0)
              {
                  operands.Add(ReadRb());
              }

              if ((flags & TextureFlags.LodLevel) != 0)
              {
                  operands.Add(ConstF(0));
              }
          }
      }
      else if (op is OpCodeTlds tldsOp)
      {
          type = ConvertSamplerType(tldsOp.Target);

          if (type == SamplerType.None)
          {
              context.Config.GpuAccessor.Log("Invalid texel fetch sampler type.");

              return;
          }

          context.Config.SetUsedFeature(FeatureFlags.IntegerSampling);

          flags = ConvertTextureFlags(tldsOp.Target) | TextureFlags.IntCoords;

          // A 1D LOD-zero fetch is treated as a buffer fetch when the accessor
          // reports the handle as a texture buffer.
          if (tldsOp.Target == TexelLoadTarget.Texture1DLodZero && context.Config.GpuAccessor.QueryIsTextureBuffer(tldsOp.Immediate))
          {
              type = SamplerType.TextureBuffer;

              flags &= ~TextureFlags.LodLevel;
          }

          switch (tldsOp.Target)
          {
              case TexelLoadTarget.Texture1DLodZero:
                  operands.Add(ReadRa());

                  if (type != SamplerType.TextureBuffer)
                  {
                      if (Sample1DAs2D)
                      {
                          operands.Add(ConstF(0));

                          type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                      }

                      operands.Add(ConstF(0));
                  }
                  break;

              case TexelLoadTarget.Texture1DLodLevel:
                  operands.Add(ReadRa());

                  if (Sample1DAs2D)
                  {
                      operands.Add(ConstF(0));

                      type = (type & ~SamplerType.Mask) | SamplerType.Texture2D;
                  }

                  operands.Add(ReadRb());
                  break;

              case TexelLoadTarget.Texture2DLodZero:
                  operands.Add(ReadRa());
                  operands.Add(ReadRb());
                  operands.Add(Const(0));
                  break;

              case TexelLoadTarget.Texture2DLodZeroOffset:
                  operands.Add(ReadRa());
                  operands.Add(ReadRa());
                  operands.Add(Const(0));
                  break;

              case TexelLoadTarget.Texture2DLodZeroMultisample:
              case TexelLoadTarget.Texture2DLodLevel:
              case TexelLoadTarget.Texture2DLodLevelOffset:
                  operands.Add(ReadRa());
                  operands.Add(ReadRa());
                  operands.Add(ReadRb());
                  break;

              case TexelLoadTarget.Texture3DLodZero:
                  operands.Add(ReadRa());
                  operands.Add(ReadRa());
                  operands.Add(ReadRb());
                  operands.Add(Const(0));
                  break;

              case TexelLoadTarget.Texture2DArrayLodZero:
                  operands.Add(ReadRb());
                  operands.Add(ReadRb());
                  operands.Add(ReadRa());
                  operands.Add(Const(0));
                  break;
          }

          if ((flags & TextureFlags.Offset) != 0)
          {
              AppendPackedOffsets(type.GetDimensions(), 4, 4);
          }
      }
      else if (op is OpCodeTld4s tld4sOp)
      {
          // With depth compare or offset both coordinates come from Ra;
          // otherwise the second one comes from Rb.
          bool bothFromRa = tld4sOp.HasDepthCompare || tld4sOp.HasOffset;

          operands.Add(ReadRa());
          operands.Add(bothFromRa ? ReadRa() : ReadRb());

          type = SamplerType.Texture2D;
          flags = TextureFlags.Gather;

          if (tld4sOp.HasDepthCompare)
          {
              operands.Add(ReadRb());

              type |= SamplerType.Shadow;
          }

          if (tld4sOp.HasOffset)
          {
              AppendPackedOffsets(type.GetDimensions(), 8, 6);

              flags |= TextureFlags.Offset;
          }

          operands.Add(Const(tld4sOp.GatherCompIndex));
      }
      else
      {
          throw new InvalidOperationException($"Invalid opcode type \"{op.GetType().Name}\".");
      }

      Operand[] sources = operands.ToArray();

      // Halves of the two destination registers for the FP16 path; entries that
      // are never written stay at zero.
      Operand[] rd0 = new Operand[2] { ConstF(0), ConstF(0) };
      Operand[] rd1 = new Operand[2] { ConstF(0), ConstF(0) };

      int destSlot = 0;

      // Returns the destination for the next enabled component. Slots 0-1 map to
      // Rd0, later slots to Rd1. In FP16 mode a fresh local is handed out and
      // remembered so it can be packed afterwards.
      Operand NextDest()
      {
          int slot = destSlot++;

          bool useSecond = (slot >> 1) != 0;
          int lane = slot & 1;

          if (op.IsFp16)
          {
              Operand half = Local();

              if (useSecond)
              {
                  rd1[lane] = half;
              }
              else
              {
                  rd0[lane] = half;
              }

              return half;
          }

          int regIndex = useSecond ? op.Rd1.Index : op.Rd0.Index;

          if (regIndex < RegisterConsts.RegisterZeroIndex)
          {
              regIndex += lane;
          }

          return Register(regIndex, RegisterType.Gpr);
      }

      int handle = op.Immediate;

      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; pending >>= 1, component++)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(new TextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }

      if (op.IsFp16)
      {
          // Pack each pair of half results into its destination register.
          context.Copy(Register(op.Rd0), context.PackHalf2x16(rd0[0], rd0[1]));
          context.Copy(Register(op.Rd1), context.PackHalf2x16(rd1[0], rd1[1]));
      }
  }
  /// <summary>
  /// Emits the IR for a texture gather. The current opcode is read as an
  /// <see cref="IOpCodeTld4"/>; one <see cref="Instruction.TextureSample"/> operation
  /// carrying the gather flag is added per bit set in the component mask.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations.</param>
  public static void Tld4(EmitterContext context)
  {
      IOpCodeTld4 op = (IOpCodeTld4)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Sequential readers over Ra / Rb; past RegisterZeroIndex they yield constant zero.
      Operand ReadRa()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      Operand ReadRb()
      {
          return nextRb > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRb++, RegisterType.Gpr));
      }

      // The array index is read before the coordinates but appended after them.
      Operand layer = null;

      if (op.IsArray)
      {
          layer = ReadRa();
      }

      List<Operand> operands = new List<Operand>();

      SamplerType type = ConvertSamplerType(op.Dimensions);

      TextureFlags flags = TextureFlags.Gather;

      if (op.Bindless)
      {
          operands.Add(ReadRb());

          flags |= TextureFlags.Bindless;
      }

      int coordsCount = type.GetDimensions();

      for (int i = 0; i < coordsCount; i++)
      {
          operands.Add(ReadRa());
      }

      bool promotedTo2D = Sample1DAs2D && type == SamplerType.Texture1D;

      if (promotedTo2D)
      {
          operands.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      if (op.IsArray)
      {
          operands.Add(layer);

          type |= SamplerType.Array;
      }

      // Up to two packed offset registers are read from Rb: one for any offset
      // mode, a second one only for the four-offsets mode.
      bool hasOffset = op.Offset != TextureGatherOffset.None;
      Operand packedFirst = hasOffset ? ReadRb() : null;

      bool hasFourOffsets = op.Offset == TextureGatherOffset.Offsets;
      Operand packedSecond = hasFourOffsets ? ReadRb() : null;

      if (op.HasDepthCompare)
      {
          operands.Add(ReadRb());

          type |= SamplerType.Shadow;
      }

      if (hasOffset)
      {
          int texelCount = hasFourOffsets ? 4 : 1;
          int totalOffsets = coordsCount * texelCount;

          for (int i = 0; i < totalOffsets; i++)
          {
              // Four 8-bit-spaced fields per packed register, 6 bits each.
              Operand packed = ((i >> 2) & 1) == 0 ? packedFirst : packedSecond;

              operands.Add(context.BitfieldExtractS32(packed, Const((i & 3) * 8), Const(6)));
          }

          if (promotedTo2D)
          {
              for (int i = 0; i < texelCount; i++)
              {
                  operands.Add(Const(0));
              }
          }

          if (hasFourOffsets)
          {
              flags |= TextureFlags.Offsets;
          }
          else
          {
              flags |= TextureFlags.Offset;
          }
      }

      operands.Add(Const(op.GatherCompIndex));

      Operand[] sources = operands.ToArray();

      int nextRd = op.Rd.Index;

      // Destination registers are handed out sequentially starting at Rd.
      Operand NextDest()
      {
          return nextRd > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : Register(nextRd++, RegisterType.Gpr);
      }

      int handle = op.Immediate;

      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; pending >>= 1, component++)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(new TextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>Emits the bindless variant of the texture mip-map level query.</summary>
  /// <param name="context">Emitter context for the current opcode.</param>
  public static void TmmlB(EmitterContext context) => EmitTextureMipMapLevel(context, true);
  /// <summary>Emits the non-bindless variant of the texture mip-map level query.</summary>
  /// <param name="context">Emitter context for the current opcode.</param>
  public static void Tmml(EmitterContext context) => EmitTextureMipMapLevel(context, false);
  /// <summary>
  /// Emits <see cref="Instruction.Lod"/> operations for the current opcode. For the first
  /// two components the result is multiplied by 256 and converted to a signed 32-bit
  /// integer before being copied to the destination; any further component is set to zero.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations.</param>
  /// <param name="isBindless">When true, the first source is read from Rb and the handle is 0.</param>
  private static void EmitTextureMipMapLevel(EmitterContext context, bool isBindless)
  {
      OpCodeTexture op = (OpCodeTexture)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Sequential readers over Ra / Rb; past RegisterZeroIndex they yield constant zero.
      Operand ReadRa()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      Operand ReadRb()
      {
          return nextRb > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRb++, RegisterType.Gpr));
      }

      TextureFlags flags = TextureFlags.None;

      List<Operand> operands = new List<Operand>();

      if (isBindless)
      {
          operands.Add(ReadRb());

          flags |= TextureFlags.Bindless;
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      int coordsCount = type.GetDimensions();

      // The array index is read before the coordinates but appended after them.
      Operand layer = null;

      if (op.IsArray)
      {
          layer = ReadRa();
      }

      for (int i = 0; i < coordsCount; i++)
      {
          operands.Add(ReadRa());
      }

      if (Sample1DAs2D && type == SamplerType.Texture1D)
      {
          operands.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      if (op.IsArray)
      {
          operands.Add(layer);

          type |= SamplerType.Array;
      }

      Operand[] sources = operands.ToArray();

      int nextRd = op.Rd.Index;

      // Destination registers are handed out sequentially starting at Rd.
      Operand NextDest()
      {
          return nextRd > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : Register(nextRd++, RegisterType.Gpr);
      }

      int handle = isBindless ? 0 : op.Immediate;

      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; pending >>= 1, component++)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          if (component < 2)
          {
              Operand rawLod = Local();

              context.Add(new TextureOperation(
                  Instruction.Lod,
                  type,
                  flags,
                  handle,
                  component,
                  rawLod,
                  sources));

              // Scale by 256, then convert to a signed integer.
              Operand scaled = context.FPMultiply(rawLod, ConstF(256.0f));

              context.Copy(dest, context.FPConvertToS32(scaled));
          }
          else
          {
              // Components z and w aren't standard, we return 0 in this case and add a comment.
              context.Add(new CommentNode("Unsupported component z or w found"));

              context.Copy(dest, Const(0));
          }
      }
  }
  /// <summary>
  /// Emits the IR for a texture sample with explicit derivatives. The current opcode is
  /// read as an <see cref="OpCodeTxd"/>; one <see cref="Instruction.TextureSample"/>
  /// operation carrying the derivatives flag is added per bit set in the component mask.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations.</param>
  public static void Txd(EmitterContext context)
  {
      OpCodeTxd op = (OpCodeTxd)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      int nextRa = op.Ra.Index;
      int nextRb = op.Rb.Index;

      // Sequential readers over Ra / Rb; past RegisterZeroIndex they yield constant zero.
      Operand ReadRa()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      Operand ReadRb()
      {
          return nextRb > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRb++, RegisterType.Gpr));
      }

      TextureFlags flags = TextureFlags.Derivatives;

      List<Operand> operands = new List<Operand>();

      if (op.IsBindless)
      {
          // Here the bindless handle is taken from Ra, ahead of the coordinates.
          operands.Add(ReadRa());

          flags |= TextureFlags.Bindless;
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      int coordsCount = type.GetDimensions();

      for (int i = 0; i < coordsCount; i++)
      {
          operands.Add(ReadRa());
      }

      bool promotedTo2D = Sample1DAs2D && type == SamplerType.Texture1D;

      if (promotedTo2D)
      {
          operands.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      // One more Ra register: its low 16 bits give the array index, and offsets
      // are extracted from bit 16 upwards.
      Operand packed = ReadRa();

      if (op.IsArray)
      {
          operands.Add(context.BitwiseAnd(packed, Const(0xffff)));

          type |= SamplerType.Array;
      }

      // Derivatives (X and Y).
      int derivativeCount = 2 * coordsCount;

      for (int i = 0; i < derivativeCount; i++)
      {
          operands.Add(ReadRb());

          if (promotedTo2D)
          {
              operands.Add(ConstF(0));
          }
      }

      if (op.HasOffset)
      {
          for (int i = 0; i < coordsCount; i++)
          {
              operands.Add(context.BitfieldExtractS32(packed, Const(16 + i * 4), Const(4)));
          }

          if (promotedTo2D)
          {
              operands.Add(Const(0));
          }

          flags |= TextureFlags.Offset;
      }

      Operand[] sources = operands.ToArray();

      int nextRd = op.Rd.Index;

      // Destination registers are handed out sequentially starting at Rd.
      Operand NextDest()
      {
          return nextRd > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : Register(nextRd++, RegisterType.Gpr);
      }

      int handle = op.IsBindless ? 0 : op.Immediate;

      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; pending >>= 1, component++)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(new TextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>Emits the non-bindless variant of the texture query.</summary>
  /// <param name="context">Emitter context for the current opcode.</param>
  public static void Txq(EmitterContext context) => EmitTextureQuery(context, bindless: false);
  /// <summary>Emits the bindless variant of the texture query.</summary>
  /// <param name="context">Emitter context for the current opcode.</param>
  public static void TxqB(EmitterContext context) => EmitTextureQuery(context, bindless: true);
  /// <summary>
  /// Emits <see cref="Instruction.TextureSize"/> operations for the current opcode, one per
  /// bit set in the component mask. The queried property is decoded from the raw opcode
  /// but not used yet; the sampler type is always <see cref="SamplerType.Texture2D"/>.
  /// </summary>
  /// <param name="context">Emitter context providing the current opcode and receiving the generated operations.</param>
  /// <param name="bindless">When true, an extra leading source is read from Ra and the handle is 0.</param>
  private static void EmitTextureQuery(EmitterContext context, bool bindless)
  {
      OpCodeTex op = (OpCodeTex)context.CurrOp;

      if (op.Rd.IsRZ)
      {
          return;
      }

      TextureProperty property = (TextureProperty)op.RawOpCode.Extract(22, 6);

      // TODO: Validate and use property.
      Instruction inst = Instruction.TextureSize;

      SamplerType type = SamplerType.Texture2D;

      TextureFlags flags;

      if (bindless)
      {
          flags = TextureFlags.Bindless;
      }
      else
      {
          flags = TextureFlags.None;
      }

      int nextRa = op.Ra.Index;

      // Sequential reader over Ra; past RegisterZeroIndex it yields constant zero.
      Operand ReadRa()
      {
          return nextRa > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(nextRa++, RegisterType.Gpr));
      }

      List<Operand> operands = new List<Operand>();

      if (bindless)
      {
          operands.Add(ReadRa());
      }

      operands.Add(ReadRa());

      Operand[] sources = operands.ToArray();

      int nextRd = op.Rd.Index;

      // Destination registers are handed out sequentially starting at Rd.
      Operand NextDest()
      {
          return nextRd > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : Register(nextRd++, RegisterType.Gpr);
      }

      int handle = bindless ? 0 : op.Immediate;

      int pending = op.ComponentMask;

      for (int component = 0; pending != 0; pending >>= 1, component++)
      {
          if ((pending & 1) == 0)
          {
              continue;
          }

          Operand dest = NextDest();

          context.Add(new TextureOperation(
              inst,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>
  /// Emits the texture sample operations for the current texture opcode,
  /// one operation for each component enabled on the opcode component mask.
  /// </summary>
  /// <param name="context">Emitter context that supplies the current opcode and receives the emitted operations</param>
  /// <param name="flags">Initial texture flags; LOD and offset flags are added here as the opcode requires</param>
  private static void EmitTextureSample(EmitterContext context, TextureFlags flags)
  {
      OpCodeTexture op = (OpCodeTexture)context.CurrOp;

      // Nothing is emitted when the destination register is RZ.
      if (op.Rd.IsRZ)
      {
          return;
      }

      bool isBindless = (flags & TextureFlags.Bindless) != 0;

      int raCursor = op.Ra.Index;
      int rbCursor = op.Rb.Index;

      // Yields a copy of the next register of the sequence starting at Ra,
      // or a zero constant once the cursor went past the zero register index.
      Operand TakeRa()
      {
          return raCursor > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(raCursor++, RegisterType.Gpr));
      }

      // Same as above, for the sequence starting at Rb.
      Operand TakeRb()
      {
          return rbCursor > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : context.Copy(Register(rbCursor++, RegisterType.Gpr));
      }

      // The array index is taken from Ra ahead of the coordinates,
      // even though it is appended to the sources after them.
      Operand arrayIndex = op.IsArray ? TakeRa() : null;

      var sourcesList = new List<Operand>();

      if (isBindless)
      {
          sourcesList.Add(TakeRb());
      }

      SamplerType type = ConvertSamplerType(op.Dimensions);

      TextureLodMode lodMode = op.LodMode;

      bool hasLod = lodMode > TextureLodMode.LodZero;

      bool isPlainIntCoordsAccess =
          (flags & ~TextureFlags.Bindless) == TextureFlags.IntCoords &&
          !hasLod &&
          !op.HasDepthCompare &&
          !op.HasOffset &&
          !op.IsArray &&
          !op.IsMultisample;

      // With bindless there is no way to find out the real texture type,
      // so a 1D sampler type is assumed to be a texture buffer, as that is the more common case.
      if (type == SamplerType.Texture1D &&
          isPlainIntCoordsAccess &&
          (isBindless || context.Config.GpuAccessor.QueryIsTextureBuffer(op.Immediate)))
      {
          type = SamplerType.TextureBuffer;
      }

      int coordsCount = type.GetDimensions();

      for (int coord = 0; coord < coordsCount; coord++)
      {
          sourcesList.Add(TakeRa());
      }

      if (Sample1DAs2D && type == SamplerType.Texture1D)
      {
          // Second coordinate for the 1D texture that is being sampled as 2D.
          sourcesList.Add(ConstF(0));

          type = SamplerType.Texture2D;
      }

      if (op.IsArray)
      {
          sourcesList.Add(arrayIndex);

          type |= SamplerType.Array;
      }

      // Rb is consumed in a fixed order: LOD value, packed offsets, depth compare value.
      Operand lodValue = hasLod ? TakeRb() : ConstF(0);

      Operand packedOffs = op.HasOffset ? TakeRb() : null;

      if (op.HasDepthCompare)
      {
          sourcesList.Add(TakeRb());

          type |= SamplerType.Shadow;
      }

      bool usesLodLevel =
          lodMode == TextureLodMode.LodZero ||
          lodMode == TextureLodMode.LodLevel ||
          lodMode == TextureLodMode.LodLevelA;

      if (usesLodLevel && !op.IsMultisample && type != SamplerType.TextureBuffer)
      {
          sourcesList.Add(lodValue);

          flags |= TextureFlags.LodLevel;
      }

      if (op.HasOffset)
      {
          // One signed 4-bit field is extracted from the packed value for each coordinate.
          for (int coord = 0; coord < coordsCount; coord++)
          {
              sourcesList.Add(context.BitfieldExtractS32(packedOffs, Const(coord * 4), Const(4)));
          }

          flags |= TextureFlags.Offset;
      }

      if (lodMode == TextureLodMode.LodBias || lodMode == TextureLodMode.LodBiasA)
      {
          sourcesList.Add(lodValue);

          flags |= TextureFlags.LodBias;
      }

      if (op.IsMultisample)
      {
          sourcesList.Add(TakeRb());

          type |= SamplerType.Multisample;
      }

      Operand[] sources = sourcesList.ToArray();

      int rdCursor = op.Rd.Index;

      // Yields the next destination register of the sequence starting at Rd,
      // or a zero constant once the cursor went past the zero register index.
      Operand TakeDest()
      {
          return rdCursor > RegisterConsts.RegisterZeroIndex
              ? Const(0)
              : Register(rdCursor++, RegisterType.Gpr);
      }

      int handle = isBindless ? 0 : op.Immediate;

      int pendingMask = op.ComponentMask;

      for (int component = 0; pendingMask != 0; component++, pendingMask >>= 1)
      {
          if ((pendingMask & 1) == 0)
          {
              continue;
          }

          Operand dest = TakeDest();

          context.Add(new TextureOperation(
              Instruction.TextureSample,
              type,
              flags,
              handle,
              component,
              dest,
              sources));
      }
  }
  /// <summary>
  /// Gets the number of components associated with an integer size.
  /// </summary>
  /// <param name="size">Integer size to query</param>
  /// <returns>2 for B64, 4 for B128 and UB128, and 1 for every other size</returns>
  private static int GetComponents(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.B64:
              return 2;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return 4;

          default:
              return 1;
      }
  }
  /// <summary>
  /// Gets the base 2 logarithm of the size in bytes associated with an integer size.
  /// </summary>
  /// <param name="size">Integer size to query</param>
  /// <returns>
  /// 0 for U8 and S8, 1 for U16 and S16, 2 for B32, 3 for B64,
  /// 4 for B128 and UB128, and 2 for any other size
  /// </returns>
  private static int GetComponentSizeInBytesLog2(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.U8:
          case IntegerSize.S8:
              return 0;

          case IntegerSize.U16:
          case IntegerSize.S16:
              return 1;

          case IntegerSize.B64:
              return 3;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return 4;

          // B32 shares its value with the fallback used for unlisted sizes.
          case IntegerSize.B32:
          default:
              return 2;
      }
  }
  /// <summary>
  /// Gets the unsigned or signed integer texture format associated with an integer size.
  /// </summary>
  /// <param name="size">Integer size to query</param>
  /// <returns>The matching texture format, or R32Uint for sizes that are not listed</returns>
  private static TextureFormat GetTextureFormat(IntegerSize size)
  {
      switch (size)
      {
          case IntegerSize.U8:
              return TextureFormat.R8Uint;

          case IntegerSize.S8:
              return TextureFormat.R8Sint;

          case IntegerSize.U16:
              return TextureFormat.R16Uint;

          case IntegerSize.S16:
              return TextureFormat.R16Sint;

          case IntegerSize.B64:
              return TextureFormat.R32G32Uint;

          case IntegerSize.B128:
          case IntegerSize.UB128:
              return TextureFormat.R32G32B32A32Uint;

          // B32 shares its format with the fallback used for unlisted sizes.
          case IntegerSize.B32:
          default:
              return TextureFormat.R32Uint;
      }
  }
  /// <summary>
  /// Converts image dimensions into the equivalent sampler type.
  /// </summary>
  /// <param name="target">Image dimensions to convert</param>
  /// <returns>The equivalent sampler type, or <see cref="SamplerType.None"/> for dimensions that are not listed</returns>
  private static SamplerType ConvertSamplerType(ImageDimensions target)
  {
      switch (target)
      {
          case ImageDimensions.Image1D:
              return SamplerType.Texture1D;

          case ImageDimensions.ImageBuffer:
              return SamplerType.TextureBuffer;

          case ImageDimensions.Image1DArray:
              return SamplerType.Texture1D | SamplerType.Array;

          case ImageDimensions.Image2D:
              return SamplerType.Texture2D;

          case ImageDimensions.Image2DArray:
              return SamplerType.Texture2D | SamplerType.Array;

          case ImageDimensions.Image3D:
              return SamplerType.Texture3D;

          default:
              return SamplerType.None;
      }
  }
  /// <summary>
  /// Converts texture dimensions into the equivalent sampler type.
  /// </summary>
  /// <param name="dimensions">Texture dimensions to convert</param>
  /// <returns>The equivalent sampler type</returns>
  /// <exception cref="ArgumentException">Thrown when <paramref name="dimensions"/> is not 1D, 2D, 3D or cube</exception>
  private static SamplerType ConvertSamplerType(TextureDimensions dimensions)
  {
      switch (dimensions)
      {
          case TextureDimensions.Texture1D:
              return SamplerType.Texture1D;

          case TextureDimensions.Texture2D:
              return SamplerType.Texture2D;

          case TextureDimensions.Texture3D:
              return SamplerType.Texture3D;

          case TextureDimensions.TextureCube:
              return SamplerType.TextureCube;

          default:
              throw new ArgumentException($"Invalid texture dimensions \"{dimensions}\".");
      }
  }
  /// <summary>
  /// Converts a texture target into the equivalent sampler type.
  /// </summary>
  /// <param name="type">Texture target to convert</param>
  /// <returns>The equivalent sampler type, or <see cref="SamplerType.None"/> for targets that are not listed</returns>
  private static SamplerType ConvertSamplerType(TextureTarget type)
  {
      return type switch
      {
          TextureTarget.Texture1DLodZero => SamplerType.Texture1D,

          TextureTarget.Texture2D => SamplerType.Texture2D,
          TextureTarget.Texture2DLodZero => SamplerType.Texture2D,
          TextureTarget.Texture2DLodLevel => SamplerType.Texture2D,

          TextureTarget.Texture2DDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,
          TextureTarget.Texture2DLodLevelDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,
          TextureTarget.Texture2DLodZeroDepthCompare => SamplerType.Texture2D | SamplerType.Shadow,

          TextureTarget.Texture2DArray => SamplerType.Texture2D | SamplerType.Array,
          TextureTarget.Texture2DArrayLodZero => SamplerType.Texture2D | SamplerType.Array,

          TextureTarget.Texture2DArrayLodZeroDepthCompare =>
              SamplerType.Texture2D | SamplerType.Array | SamplerType.Shadow,

          TextureTarget.Texture3D => SamplerType.Texture3D,
          TextureTarget.Texture3DLodZero => SamplerType.Texture3D,

          TextureTarget.TextureCube => SamplerType.TextureCube,
          TextureTarget.TextureCubeLodLevel => SamplerType.TextureCube,

          _ => SamplerType.None
      };
  }
  /// <summary>
  /// Converts a texel load target into the equivalent sampler type.
  /// </summary>
  /// <param name="type">Texel load target to convert</param>
  /// <returns>The equivalent sampler type, or <see cref="SamplerType.None"/> for targets that are not listed</returns>
  private static SamplerType ConvertSamplerType(TexelLoadTarget type)
  {
      return type switch
      {
          TexelLoadTarget.Texture1DLodZero => SamplerType.Texture1D,
          TexelLoadTarget.Texture1DLodLevel => SamplerType.Texture1D,

          TexelLoadTarget.Texture2DLodZero => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodZeroOffset => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodLevel => SamplerType.Texture2D,
          TexelLoadTarget.Texture2DLodLevelOffset => SamplerType.Texture2D,

          TexelLoadTarget.Texture2DLodZeroMultisample => SamplerType.Texture2D | SamplerType.Multisample,

          TexelLoadTarget.Texture3DLodZero => SamplerType.Texture3D,

          TexelLoadTarget.Texture2DArrayLodZero => SamplerType.Texture2D | SamplerType.Array,

          _ => SamplerType.None
      };
  }
  /// <summary>
  /// Gets the texture flags implied by a texture target.
  /// </summary>
  /// <param name="type">Texture target to query</param>
  /// <returns>
  /// <see cref="TextureFlags.LodLevel"/> for the targets listed below,
  /// <see cref="TextureFlags.None"/> for every other target
  /// </returns>
  private static TextureFlags ConvertTextureFlags(TextureTarget type)
  {
      return type switch
      {
          TextureTarget.Texture1DLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodLevel => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodLevelDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture2DLodZeroDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture2DArrayLodZero => TextureFlags.LodLevel,
          TextureTarget.Texture2DArrayLodZeroDepthCompare => TextureFlags.LodLevel,
          TextureTarget.Texture3DLodZero => TextureFlags.LodLevel,
          TextureTarget.TextureCubeLodLevel => TextureFlags.LodLevel,

          // Texture2D, Texture2DDepthCompare, Texture2DArray, Texture3D and TextureCube
          // carry no flags, same as any target that is not listed.
          _ => TextureFlags.None
      };
  }
  /// <summary>
  /// Gets the texture flags implied by a texel load target.
  /// </summary>
  /// <param name="type">Texel load target to query</param>
  /// <returns>
  /// <see cref="TextureFlags.LodLevel"/>, combined with <see cref="TextureFlags.Offset"/> for the offset targets,
  /// or <see cref="TextureFlags.None"/> for targets that are not listed
  /// </returns>
  private static TextureFlags ConvertTextureFlags(TexelLoadTarget type)
  {
      return type switch
      {
          TexelLoadTarget.Texture1DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture1DLodLevel => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodLevel => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DLodZeroMultisample => TextureFlags.LodLevel,
          TexelLoadTarget.Texture3DLodZero => TextureFlags.LodLevel,
          TexelLoadTarget.Texture2DArrayLodZero => TextureFlags.LodLevel,

          TexelLoadTarget.Texture2DLodZeroOffset => TextureFlags.LodLevel | TextureFlags.Offset,
          TexelLoadTarget.Texture2DLodLevelOffset => TextureFlags.LodLevel | TextureFlags.Offset,

          _ => TextureFlags.None
      };
  }
  1144. }
  1145. }