| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581 |
- using ChocolArm64.Memory;
- using Ryujinx.Graphics.Gal;
- using System;
- using System.Collections.Generic;
- namespace Ryujinx.Graphics.Gpu
- {
- public class NvGpuEngine3d : INvGpuEngine
- {
- public int[] Registers { get; private set; }
- private NsGpu Gpu;
- private Dictionary<int, NvGpuMethod> Methods;
- private struct ConstBuffer
- {
- public bool Enabled;
- public long Position;
- public int Size;
- }
- private ConstBuffer[] ConstBuffers;
- private HashSet<long> FrameBuffers;
- public NvGpuEngine3d(NsGpu Gpu)
- {
- this.Gpu = Gpu;
- Registers = new int[0xe00];
- Methods = new Dictionary<int, NvGpuMethod>();
- void AddMethod(int Meth, int Count, int Stride, NvGpuMethod Method)
- {
- while (Count-- > 0)
- {
- Methods.Add(Meth, Method);
- Meth += Stride;
- }
- }
- AddMethod(0x585, 1, 1, VertexEndGl);
- AddMethod(0x674, 1, 1, ClearBuffers);
- AddMethod(0x6c3, 1, 1, QueryControl);
- AddMethod(0x8e4, 16, 1, CbData);
- AddMethod(0x904, 1, 1, CbBind);
- ConstBuffers = new ConstBuffer[18];
- FrameBuffers = new HashSet<long>();
- }
- public void CallMethod(AMemory Memory, NsGpuPBEntry PBEntry)
- {
- if (Methods.TryGetValue(PBEntry.Method, out NvGpuMethod Method))
- {
- Method(Memory, PBEntry);
- }
- else
- {
- WriteRegister(PBEntry);
- }
- }
- private void VertexEndGl(AMemory Memory, NsGpuPBEntry PBEntry)
- {
- SetFrameBuffer(0);
- long[] Tags = UploadShaders(Memory);
- Gpu.Renderer.BindProgram();
- SetAlphaBlending();
- UploadTextures(Memory, Tags);
- UploadUniforms(Memory);
- UploadVertexArrays(Memory);
- }
- private void ClearBuffers(AMemory Memory, NsGpuPBEntry PBEntry)
- {
- int Arg0 = PBEntry.Arguments[0];
- int FbIndex = (Arg0 >> 6) & 0xf;
- int Layer = (Arg0 >> 10) & 0x3ff;
- GalClearBufferFlags Flags = (GalClearBufferFlags)(Arg0 & 0x3f);
- SetFrameBuffer(0);
- //TODO: Enable this once the frame buffer problems are fixed.
- //Gpu.Renderer.ClearBuffers(Layer, Flags);
- }
- private void SetFrameBuffer(int FbIndex)
- {
- long Address = MakeInt64From2xInt32(NvGpuEngine3dReg.FrameBufferNAddress + FbIndex * 0x10);
- FrameBuffers.Add(Address);
- int Width = ReadRegister(NvGpuEngine3dReg.FrameBufferNWidth + FbIndex * 0x10);
- int Height = ReadRegister(NvGpuEngine3dReg.FrameBufferNHeight + FbIndex * 0x10);
- //Note: Using the Width/Height results seems to give incorrect results.
- //Maybe the size of all frame buffers is hardcoded to screen size? This seems unlikely.
- Gpu.Renderer.CreateFrameBuffer(Address, 1280, 720);
- Gpu.Renderer.BindFrameBuffer(Address);
- }
- private long[] UploadShaders(AMemory Memory)
- {
- long[] Tags = new long[5];
- long BasePosition = MakeInt64From2xInt32(NvGpuEngine3dReg.ShaderAddress);
- for (int Index = 0; Index < 6; Index++)
- {
- int Control = ReadRegister(NvGpuEngine3dReg.ShaderNControl + Index * 0x10);
- int Offset = ReadRegister(NvGpuEngine3dReg.ShaderNOffset + Index * 0x10);
- //Note: Vertex Program (B) is always enabled.
- bool Enable = (Control & 1) != 0 || Index == 1;
- if (!Enable)
- {
- continue;
- }
- long Tag = BasePosition + (uint)Offset;
- long Position = Gpu.GetCpuAddr(Tag);
- //TODO: Find a better way to calculate the size.
- int Size = 0x20000;
- byte[] Code = AMemoryHelper.ReadBytes(Memory, Position, (uint)Size);
- GalShaderType ShaderType = GetTypeFromProgram(Index);
- Tags[(int)ShaderType] = Tag;
- Gpu.Renderer.CreateShader(Tag, ShaderType, Code);
- Gpu.Renderer.BindShader(Tag);
- }
- int RawSX = ReadRegister(NvGpuEngine3dReg.ViewportScaleX);
- int RawSY = ReadRegister(NvGpuEngine3dReg.ViewportScaleY);
- float SX = BitConverter.Int32BitsToSingle(RawSX);
- float SY = BitConverter.Int32BitsToSingle(RawSY);
- float SignX = MathF.Sign(SX);
- float SignY = MathF.Sign(SY);
- Gpu.Renderer.SetUniform2F(GalConsts.FlipUniformName, SignX, SignY);
- return Tags;
- }
- private static GalShaderType GetTypeFromProgram(int Program)
- {
- switch (Program)
- {
- case 0:
- case 1: return GalShaderType.Vertex;
- case 2: return GalShaderType.TessControl;
- case 3: return GalShaderType.TessEvaluation;
- case 4: return GalShaderType.Geometry;
- case 5: return GalShaderType.Fragment;
- }
- throw new ArgumentOutOfRangeException(nameof(Program));
- }
- private void SetAlphaBlending()
- {
- //TODO: Support independent blend properly.
- bool Enable = (ReadRegister(NvGpuEngine3dReg.IBlendNEnable) & 1) != 0;
- Gpu.Renderer.SetBlendEnable(Enable);
- bool BlendSeparateAlpha = (ReadRegister(NvGpuEngine3dReg.IBlendNSeparateAlpha) & 1) != 0;
- GalBlendEquation EquationRgb = (GalBlendEquation)ReadRegister(NvGpuEngine3dReg.IBlendNEquationRgb);
- GalBlendFactor FuncSrcRgb = (GalBlendFactor)ReadRegister(NvGpuEngine3dReg.IBlendNFuncSrcRgb);
- GalBlendFactor FuncDstRgb = (GalBlendFactor)ReadRegister(NvGpuEngine3dReg.IBlendNFuncDstRgb);
- if (BlendSeparateAlpha)
- {
- GalBlendEquation EquationAlpha = (GalBlendEquation)ReadRegister(NvGpuEngine3dReg.IBlendNEquationAlpha);
- GalBlendFactor FuncSrcAlpha = (GalBlendFactor)ReadRegister(NvGpuEngine3dReg.IBlendNFuncSrcAlpha);
- GalBlendFactor FuncDstAlpha = (GalBlendFactor)ReadRegister(NvGpuEngine3dReg.IBlendNFuncDstAlpha);
- Gpu.Renderer.SetBlendSeparate(
- EquationRgb,
- EquationAlpha,
- FuncSrcRgb,
- FuncDstRgb,
- FuncSrcAlpha,
- FuncDstAlpha);
- }
- else
- {
- Gpu.Renderer.SetBlend(EquationRgb, FuncSrcRgb, FuncDstRgb);
- }
- }
- private void UploadTextures(AMemory Memory, long[] Tags)
- {
- long BaseShPosition = MakeInt64From2xInt32(NvGpuEngine3dReg.ShaderAddress);
- int TextureCbIndex = ReadRegister(NvGpuEngine3dReg.TextureCbIndex);
- long BasePosition = ConstBuffers[TextureCbIndex].Position;
- long Size = (uint)ConstBuffers[TextureCbIndex].Size;
- //Note: On the emulator renderer, Texture Unit 0 is
- //reserved for drawing the frame buffer.
- int TexIndex = 1;
- for (int Index = 0; Index < Tags.Length; Index++)
- {
- foreach (ShaderDeclInfo DeclInfo in Gpu.Renderer.GetTextureUsage(Tags[Index]))
- {
- long Position = BasePosition + Index * Size;
- UploadTexture(Memory, Position, TexIndex, DeclInfo.Index);
- Gpu.Renderer.SetUniform1(DeclInfo.Name, TexIndex);
- TexIndex++;
- }
- }
- }
- private void UploadTexture(AMemory Memory, long BasePosition, int TexIndex, int HndIndex)
- {
- long Position = BasePosition + HndIndex * 4;
- int TextureHandle = Memory.ReadInt32(Position);
- int TicIndex = (TextureHandle >> 0) & 0xfffff;
- int TscIndex = (TextureHandle >> 20) & 0xfff;
- TryGetCpuAddr(NvGpuEngine3dReg.TexHeaderPoolOffset, out long TicPosition);
- TryGetCpuAddr(NvGpuEngine3dReg.TexSamplerPoolOffset, out long TscPosition);
- TicPosition += TicIndex * 0x20;
- TscPosition += TscIndex * 0x20;
- GalTextureSampler Sampler = TextureFactory.MakeSampler(Gpu, Memory, TscPosition);
- long TextureAddress = Memory.ReadInt64(TicPosition + 4) & 0xffffffffffff;
- if (FrameBuffers.Contains(TextureAddress))
- {
- //This texture is a frame buffer texture,
- //we shouldn't read anything from memory and bind
- //the frame buffer texture instead, since we're not
- //really writing anything to memory.
- Gpu.Renderer.BindFrameBufferTexture(TextureAddress, TexIndex, Sampler);
- }
- else
- {
- GalTexture Texture = TextureFactory.MakeTexture(Gpu, Memory, TicPosition);
- Gpu.Renderer.SetTextureAndSampler(TexIndex, Texture, Sampler);
- Gpu.Renderer.BindTexture(TexIndex);
- }
- }
- private void UploadUniforms(AMemory Memory)
- {
- long BasePosition = MakeInt64From2xInt32(NvGpuEngine3dReg.ShaderAddress);
- for (int Index = 0; Index < 5; Index++)
- {
- int Control = ReadRegister(NvGpuEngine3dReg.ShaderNControl + (Index + 1) * 0x10);
- int Offset = ReadRegister(NvGpuEngine3dReg.ShaderNOffset + (Index + 1) * 0x10);
- //Note: Vertex Program (B) is always enabled.
- bool Enable = (Control & 1) != 0 || Index == 0;
- if (!Enable)
- {
- continue;
- }
- for (int Cbuf = 0; Cbuf < ConstBuffers.Length; Cbuf++)
- {
- ConstBuffer Cb = ConstBuffers[Cbuf];
- if (Cb.Enabled)
- {
- long CbPosition = Cb.Position + Index * Cb.Size;
- byte[] Data = AMemoryHelper.ReadBytes(Memory, CbPosition, (uint)Cb.Size);
- Gpu.Renderer.SetConstBuffer(BasePosition + (uint)Offset, Cbuf, Data);
- }
- }
- }
- }
- private void UploadVertexArrays(AMemory Memory)
- {
- long IndexPosition = MakeInt64From2xInt32(NvGpuEngine3dReg.IndexArrayAddress);
- int IndexSize = ReadRegister(NvGpuEngine3dReg.IndexArrayFormat);
- int IndexFirst = ReadRegister(NvGpuEngine3dReg.IndexBatchFirst);
- int IndexCount = ReadRegister(NvGpuEngine3dReg.IndexBatchCount);
- GalIndexFormat IndexFormat = (GalIndexFormat)IndexSize;
- IndexSize = 1 << IndexSize;
- if (IndexSize > 4)
- {
- throw new InvalidOperationException();
- }
- if (IndexSize != 0)
- {
- IndexPosition = Gpu.GetCpuAddr(IndexPosition);
- int BufferSize = IndexCount * IndexSize;
- byte[] Data = AMemoryHelper.ReadBytes(Memory, IndexPosition, BufferSize);
- Gpu.Renderer.SetIndexArray(Data, IndexFormat);
- }
- List<GalVertexAttrib>[] Attribs = new List<GalVertexAttrib>[32];
- for (int Attr = 0; Attr < 16; Attr++)
- {
- int Packed = ReadRegister(NvGpuEngine3dReg.VertexAttribNFormat + Attr);
- int ArrayIndex = Packed & 0x1f;
- if (Attribs[ArrayIndex] == null)
- {
- Attribs[ArrayIndex] = new List<GalVertexAttrib>();
- }
- Attribs[ArrayIndex].Add(new GalVertexAttrib(
- Attr,
- ((Packed >> 6) & 0x1) != 0,
- (Packed >> 7) & 0x3fff,
- (GalVertexAttribSize)((Packed >> 21) & 0x3f),
- (GalVertexAttribType)((Packed >> 27) & 0x7),
- ((Packed >> 31) & 0x1) != 0));
- }
- for (int Index = 0; Index < 32; Index++)
- {
- int VertexFirst = ReadRegister(NvGpuEngine3dReg.VertexArrayFirst);
- int VertexCount = ReadRegister(NvGpuEngine3dReg.VertexArrayCount);
- int Control = ReadRegister(NvGpuEngine3dReg.VertexArrayNControl + Index * 4);
- bool Enable = (Control & 0x1000) != 0;
- long VertexPosition = MakeInt64From2xInt32(NvGpuEngine3dReg.VertexArrayNAddress + Index * 4);
- if (!Enable)
- {
- continue;
- }
- int Stride = Control & 0xfff;
- long Size = 0;
- if (IndexCount != 0)
- {
- Size = GetVertexCountFromIndexBuffer(
- Memory,
- IndexPosition,
- IndexCount,
- IndexSize);
- }
- else
- {
- Size = VertexCount;
- }
- //TODO: Support cases where the Stride is 0.
- //In this case, we need to use the size of the attribute.
- Size *= Stride;
- VertexPosition = Gpu.GetCpuAddr(VertexPosition);
- byte[] Data = AMemoryHelper.ReadBytes(Memory, VertexPosition, Size);
- GalVertexAttrib[] AttribArray = Attribs[Index]?.ToArray() ?? new GalVertexAttrib[0];
- Gpu.Renderer.SetVertexArray(Index, Stride, Data, AttribArray);
- int PrimCtrl = ReadRegister(NvGpuEngine3dReg.VertexBeginGl);
- GalPrimitiveType PrimType = (GalPrimitiveType)(PrimCtrl & 0xffff);
- if (IndexCount != 0)
- {
- Gpu.Renderer.DrawElements(Index, IndexFirst, PrimType);
- }
- else
- {
- Gpu.Renderer.DrawArrays(Index, VertexFirst, VertexCount, PrimType);
- }
- }
- }
- private int GetVertexCountFromIndexBuffer(
- AMemory Memory,
- long IndexPosition,
- int IndexCount,
- int IndexSize)
- {
- int MaxIndex = -1;
- if (IndexSize == 2)
- {
- while (IndexCount -- > 0)
- {
- ushort Value = Memory.ReadUInt16(IndexPosition);
- IndexPosition += 2;
- if (MaxIndex < Value)
- {
- MaxIndex = Value;
- }
- }
- }
- else if (IndexSize == 1)
- {
- while (IndexCount -- > 0)
- {
- byte Value = Memory.ReadByte(IndexPosition++);
- if (MaxIndex < Value)
- {
- MaxIndex = Value;
- }
- }
- }
- else if (IndexSize == 4)
- {
- while (IndexCount -- > 0)
- {
- uint Value = Memory.ReadUInt32(IndexPosition);
- IndexPosition += 2;
- if (MaxIndex < Value)
- {
- MaxIndex = (int)Value;
- }
- }
- }
- else
- {
- throw new ArgumentOutOfRangeException(nameof(IndexSize));
- }
- return MaxIndex + 1;
- }
- private void QueryControl(AMemory Memory, NsGpuPBEntry PBEntry)
- {
- if (TryGetCpuAddr(NvGpuEngine3dReg.QueryAddress, out long Position))
- {
- int Seq = Registers[(int)NvGpuEngine3dReg.QuerySequence];
- int Ctrl = Registers[(int)NvGpuEngine3dReg.QueryControl];
- int Mode = Ctrl & 3;
- if (Mode == 0)
- {
- //Write mode.
- Memory.WriteInt32(Position, Seq);
- }
- }
- WriteRegister(PBEntry);
- }
- private void CbData(AMemory Memory, NsGpuPBEntry PBEntry)
- {
- if (TryGetCpuAddr(NvGpuEngine3dReg.ConstBufferNAddress, out long Position))
- {
- int Offset = ReadRegister(NvGpuEngine3dReg.ConstBufferNOffset);
- foreach (int Arg in PBEntry.Arguments)
- {
- Memory.WriteInt32(Position + Offset, Arg);
- Offset += 4;
- }
- WriteRegister(NvGpuEngine3dReg.ConstBufferNOffset, Offset);
- }
- }
- private void CbBind(AMemory Memory, NsGpuPBEntry PBEntry)
- {
- int Index = PBEntry.Arguments[0];
- bool Enabled = (Index & 1) != 0;
- Index = (Index >> 4) & 0x1f;
- if (TryGetCpuAddr(NvGpuEngine3dReg.ConstBufferNAddress, out long Position))
- {
- ConstBuffers[Index].Position = Position;
- ConstBuffers[Index].Enabled = Enabled;
- ConstBuffers[Index].Size = ReadRegister(NvGpuEngine3dReg.ConstBufferNSize);
- }
- }
- private int ReadCb(AMemory Memory, int Cbuf, int Offset)
- {
- long Position = ConstBuffers[Cbuf].Position;
- int Value = Memory.ReadInt32(Position + Offset);
- return Value;
- }
- private bool TryGetCpuAddr(NvGpuEngine3dReg Reg, out long Position)
- {
- Position = MakeInt64From2xInt32(Reg);
- Position = Gpu.GetCpuAddr(Position);
- return Position != -1;
- }
- private long MakeInt64From2xInt32(NvGpuEngine3dReg Reg)
- {
- return
- (long)Registers[(int)Reg + 0] << 32 |
- (uint)Registers[(int)Reg + 1];
- }
- private void WriteRegister(NsGpuPBEntry PBEntry)
- {
- int ArgsCount = PBEntry.Arguments.Count;
- if (ArgsCount > 0)
- {
- Registers[PBEntry.Method] = PBEntry.Arguments[ArgsCount - 1];
- }
- }
- private int ReadRegister(NvGpuEngine3dReg Reg)
- {
- return Registers[(int)Reg];
- }
- private void WriteRegister(NvGpuEngine3dReg Reg, int Value)
- {
- Registers[(int)Reg] = Value;
- }
- public bool IsFrameBufferPosition(long Position)
- {
- return FrameBuffers.Contains(Position);
- }
- }
- }
|