using Ryujinx.Common.Logging; using Ryujinx.Graphics.GAL; using Ryujinx.Graphics.Gpu.Image; using Ryujinx.Graphics.Gpu.Memory; using Ryujinx.Graphics.Gpu.Shader; using Ryujinx.Graphics.Gpu.State; using Ryujinx.Graphics.Shader; using Ryujinx.Graphics.Texture; using System; using System.Linq; using System.Runtime.InteropServices; namespace Ryujinx.Graphics.Gpu.Engine { using Texture = Image.Texture; /// /// GPU method implementations. /// partial class Methods { private readonly GpuContext _context; private readonly ShaderProgramInfo[] _currentProgramInfo; /// /// In-memory shader cache. /// public ShaderCache ShaderCache { get; } /// /// GPU buffer manager. /// public BufferManager BufferManager { get; } /// /// GPU texture manager. /// public TextureManager TextureManager { get; } private bool _isAnyVbInstanced; private bool _vsUsesInstanceId; private byte _vsClipDistancesWritten; private bool _forceShaderUpdate; private bool _prevTfEnable; /// /// Creates a new instance of the GPU methods class. /// /// GPU context public Methods(GpuContext context) { _context = context; ShaderCache = new ShaderCache(_context); _currentProgramInfo = new ShaderProgramInfo[Constants.ShaderStages]; BufferManager = new BufferManager(context); TextureManager = new TextureManager(context); context.MemoryManager.MemoryUnmapped += _counterCache.MemoryUnmappedHandler; context.MemoryManager.MemoryUnmapped += TextureManager.MemoryUnmappedHandler; context.MemoryManager.MemoryUnmapped += BufferManager.MemoryUnmappedHandler; } /// /// Register callback for GPU method calls that triggers an action on the GPU. /// /// GPU state where the triggers will be registered public void RegisterCallbacks(GpuState state) { state.RegisterCallback(MethodOffset.LaunchDma, LaunchDma); state.RegisterCallback(MethodOffset.LoadInlineData, LoadInlineData); state.RegisterCallback(MethodOffset.Dispatch, Dispatch); state.RegisterCallback(MethodOffset.SyncpointAction, IncrementSyncpoint); state.RegisterCallback(MethodOffset.CopyBuffer, CopyBuffer); state.RegisterCallback(MethodOffset.CopyTexture, CopyTexture); state.RegisterCallback(MethodOffset.TextureBarrier, TextureBarrier); state.RegisterCallback(MethodOffset.TextureBarrierTiled, TextureBarrierTiled); state.RegisterCallback(MethodOffset.VbElementU8, VbElementU8); state.RegisterCallback(MethodOffset.VbElementU16, VbElementU16); state.RegisterCallback(MethodOffset.VbElementU32, VbElementU32); state.RegisterCallback(MethodOffset.ResetCounter, ResetCounter); state.RegisterCallback(MethodOffset.DrawEnd, DrawEnd); state.RegisterCallback(MethodOffset.DrawBegin, DrawBegin); state.RegisterCallback(MethodOffset.DrawIndexedSmall, DrawIndexedSmall); state.RegisterCallback(MethodOffset.DrawIndexedSmall2, DrawIndexedSmall2); state.RegisterCallback(MethodOffset.DrawIndexedSmallIncInstance, DrawIndexedSmallIncInstance); state.RegisterCallback(MethodOffset.DrawIndexedSmallIncInstance2, DrawIndexedSmallIncInstance2); state.RegisterCallback(MethodOffset.IndexBufferCount, SetIndexBufferCount); state.RegisterCallback(MethodOffset.Clear, Clear); state.RegisterCallback(MethodOffset.Report, Report); state.RegisterCallback(MethodOffset.FirmwareCall4, FirmwareCall4); state.RegisterCallback(MethodOffset.UniformBufferUpdateData, 16, UniformBufferUpdate); state.RegisterCallback(MethodOffset.UniformBufferBindVertex, UniformBufferBindVertex); state.RegisterCallback(MethodOffset.UniformBufferBindTessControl, UniformBufferBindTessControl); state.RegisterCallback(MethodOffset.UniformBufferBindTessEvaluation, UniformBufferBindTessEvaluation); state.RegisterCallback(MethodOffset.UniformBufferBindGeometry, UniformBufferBindGeometry); state.RegisterCallback(MethodOffset.UniformBufferBindFragment, UniformBufferBindFragment); } /// /// Updates host state based on the current guest GPU state. /// /// Guest GPU state /// Index of the first index buffer element used on the draw /// Number of index buffer elements used on the draw private void UpdateState(GpuState state, int firstIndex, int indexCount) { bool tfEnable = state.Get(MethodOffset.TfEnable); if (!tfEnable && _prevTfEnable) { _context.Renderer.Pipeline.EndTransformFeedback(); _prevTfEnable = false; } // Shaders must be the first one to be updated if modified, because // some of the other state depends on information from the currently // bound shaders. if (state.QueryModified(MethodOffset.ShaderBaseAddress, MethodOffset.ShaderState) || _forceShaderUpdate) { _forceShaderUpdate = false; UpdateShaderState(state); } if (state.QueryModified(MethodOffset.TfBufferState)) { UpdateTfBufferState(state); } if (state.QueryModified(MethodOffset.ClipDistanceEnable)) { UpdateUserClipState(state); } if (state.QueryModified(MethodOffset.RasterizeEnable)) { UpdateRasterizerState(state); } if (state.QueryModified(MethodOffset.RtColorState, MethodOffset.RtDepthStencilState, MethodOffset.RtControl, MethodOffset.RtDepthStencilSize, MethodOffset.RtDepthStencilEnable)) { UpdateRenderTargetState(state, useControl: true); } if (state.QueryModified(MethodOffset.ScissorState)) { UpdateScissorState(state); } if (state.QueryModified(MethodOffset.ViewVolumeClipControl)) { UpdateDepthClampState(state); } if (state.QueryModified(MethodOffset.AlphaTestEnable, MethodOffset.AlphaTestRef, MethodOffset.AlphaTestFunc)) { UpdateAlphaTestState(state); } if (state.QueryModified(MethodOffset.DepthTestEnable, MethodOffset.DepthWriteEnable, MethodOffset.DepthTestFunc)) { UpdateDepthTestState(state); } if (state.QueryModified(MethodOffset.DepthMode, MethodOffset.ViewportTransform, MethodOffset.ViewportExtents)) { UpdateViewportTransform(state); } if (state.QueryModified(MethodOffset.DepthBiasState, MethodOffset.DepthBiasFactor, MethodOffset.DepthBiasUnits, MethodOffset.DepthBiasClamp)) { UpdateDepthBiasState(state); } if (state.QueryModified(MethodOffset.StencilBackMasks, MethodOffset.StencilTestState, MethodOffset.StencilBackTestState)) { UpdateStencilTestState(state); } // Pools. if (state.QueryModified(MethodOffset.SamplerPoolState, MethodOffset.SamplerIndex)) { UpdateSamplerPoolState(state); } if (state.QueryModified(MethodOffset.TexturePoolState)) { UpdateTexturePoolState(state); } // Input assembler state. if (state.QueryModified(MethodOffset.VertexAttribState)) { UpdateVertexAttribState(state); } if (state.QueryModified(MethodOffset.PointSize, MethodOffset.VertexProgramPointSize, MethodOffset.PointSpriteEnable, MethodOffset.PointCoordReplace)) { UpdatePointState(state); } if (state.QueryModified(MethodOffset.PrimitiveRestartState)) { UpdatePrimitiveRestartState(state); } if (state.QueryModified(MethodOffset.IndexBufferState)) { UpdateIndexBufferState(state, firstIndex, indexCount); } if (state.QueryModified(MethodOffset.VertexBufferDrawState, MethodOffset.VertexBufferInstanced, MethodOffset.VertexBufferState, MethodOffset.VertexBufferEndAddress)) { UpdateVertexBufferState(state); } if (state.QueryModified(MethodOffset.FaceState)) { UpdateFaceState(state); } if (state.QueryModified(MethodOffset.RtColorMaskShared, MethodOffset.RtColorMask)) { UpdateRtColorMask(state); } if (state.QueryModified(MethodOffset.BlendIndependent, MethodOffset.BlendConstant, MethodOffset.BlendStateCommon, MethodOffset.BlendEnableCommon, MethodOffset.BlendEnable, MethodOffset.BlendState)) { UpdateBlendState(state); } if (state.QueryModified(MethodOffset.LogicOpState)) { UpdateLogicOpState(state); } CommitBindings(); if (tfEnable && !_prevTfEnable) { _context.Renderer.Pipeline.BeginTransformFeedback(Topology); _prevTfEnable = true; } } /// /// Updates Rasterizer primitive discard state based on guest gpu state. /// /// Current GPU state private void UpdateRasterizerState(GpuState state) { Boolean32 enable = state.Get(MethodOffset.RasterizeEnable); _context.Renderer.Pipeline.SetRasterizerDiscard(!enable); } /// /// Ensures that the bindings are visible to the host GPU. /// Note: this actually performs the binding using the host graphics API. /// private void CommitBindings() { UpdateStorageBuffers(); TextureManager.CommitGraphicsBindings(); BufferManager.CommitGraphicsBindings(); } /// /// Updates storage buffer bindings. /// private void UpdateStorageBuffers() { for (int stage = 0; stage < _currentProgramInfo.Length; stage++) { ShaderProgramInfo info = _currentProgramInfo[stage]; if (info == null) { continue; } for (int index = 0; index < info.SBuffers.Count; index++) { BufferDescriptor sb = info.SBuffers[index]; ulong sbDescAddress = BufferManager.GetGraphicsUniformBufferAddress(stage, 0); int sbDescOffset = 0x110 + stage * 0x100 + sb.Slot * 0x10; sbDescAddress += (ulong)sbDescOffset; SbDescriptor sbDescriptor = _context.PhysicalMemory.Read(sbDescAddress); BufferManager.SetGraphicsStorageBuffer(stage, sb.Slot, sbDescriptor.PackAddress(), (uint)sbDescriptor.Size, sb.Flags); } } } /// /// Updates render targets (color and depth-stencil buffers) based on current render target state. /// /// Current GPU state /// Use draw buffers information from render target control register /// If this is not -1, it indicates that only the given indexed target will be used. private void UpdateRenderTargetState(GpuState state, bool useControl, int singleUse = -1) { var rtControl = state.Get(MethodOffset.RtControl); int count = useControl ? rtControl.UnpackCount() : Constants.TotalRenderTargets; var msaaMode = state.Get(MethodOffset.RtMsaaMode); int samplesInX = msaaMode.SamplesInX(); int samplesInY = msaaMode.SamplesInY(); var scissor = state.Get(MethodOffset.ScreenScissorState); Size sizeHint = new Size(scissor.X + scissor.Width, scissor.Y + scissor.Height, 1); bool changedScale = false; for (int index = 0; index < Constants.TotalRenderTargets; index++) { int rtIndex = useControl ? rtControl.UnpackPermutationIndex(index) : index; var colorState = state.Get(MethodOffset.RtColorState, rtIndex); if (index >= count || !IsRtEnabled(colorState)) { changedScale |= TextureManager.SetRenderTargetColor(index, null); continue; } Texture color = TextureManager.FindOrCreateTexture(colorState, samplesInX, samplesInY, sizeHint); changedScale |= TextureManager.SetRenderTargetColor(index, color); } bool dsEnable = state.Get(MethodOffset.RtDepthStencilEnable); Texture depthStencil = null; if (dsEnable) { var dsState = state.Get(MethodOffset.RtDepthStencilState); var dsSize = state.Get(MethodOffset.RtDepthStencilSize); depthStencil = TextureManager.FindOrCreateTexture(dsState, dsSize, samplesInX, samplesInY, sizeHint); } changedScale |= TextureManager.SetRenderTargetDepthStencil(depthStencil); if (changedScale) { TextureManager.UpdateRenderTargetScale(singleUse); _context.Renderer.Pipeline.SetRenderTargetScale(TextureManager.RenderTargetScale); UpdateViewportTransform(state); UpdateScissorState(state); } } /// /// Checks if a render target color buffer is used. /// /// Color buffer information /// True if the specified buffer is enabled/used, false otherwise private static bool IsRtEnabled(RtColorState colorState) { // Colors are disabled by writing 0 to the format. return colorState.Format != 0 && colorState.WidthOrStride != 0; } /// /// Updates host scissor test state based on current GPU state. /// /// Current GPU state private void UpdateScissorState(GpuState state) { for (int index = 0; index < Constants.TotalViewports; index++) { ScissorState scissor = state.Get(MethodOffset.ScissorState, index); bool enable = scissor.Enable && (scissor.X1 != 0 || scissor.Y1 != 0 || scissor.X2 != 0xffff || scissor.Y2 != 0xffff); if (enable) { int x = scissor.X1; int y = scissor.Y1; int width = scissor.X2 - x; int height = scissor.Y2 - y; float scale = TextureManager.RenderTargetScale; if (scale != 1f) { x = (int)(x * scale); y = (int)(y * scale); width = (int)Math.Ceiling(width * scale); height = (int)Math.Ceiling(height * scale); } _context.Renderer.Pipeline.SetScissor(index, true, x, y, width, height); } else { _context.Renderer.Pipeline.SetScissor(index, false, 0, 0, 0, 0); } } } /// /// Updates host depth clamp state based on current GPU state. /// /// Current GPU state private void UpdateDepthClampState(GpuState state) { ViewVolumeClipControl clip = state.Get(MethodOffset.ViewVolumeClipControl); _context.Renderer.Pipeline.SetDepthClamp((clip & ViewVolumeClipControl.DepthClampDisabled) == 0); } /// /// Updates host alpha test state based on current GPU state. /// /// Current GPU state private void UpdateAlphaTestState(GpuState state) { _context.Renderer.Pipeline.SetAlphaTest( state.Get(MethodOffset.AlphaTestEnable), state.Get(MethodOffset.AlphaTestRef), state.Get(MethodOffset.AlphaTestFunc)); } /// /// Updates host depth test state based on current GPU state. /// /// Current GPU state private void UpdateDepthTestState(GpuState state) { _context.Renderer.Pipeline.SetDepthTest(new DepthTestDescriptor( state.Get(MethodOffset.DepthTestEnable), state.Get(MethodOffset.DepthWriteEnable), state.Get(MethodOffset.DepthTestFunc))); } /// /// Updates host viewport transform and clipping state based on current GPU state. /// /// Current GPU state private void UpdateViewportTransform(GpuState state) { var yControl = state.Get (MethodOffset.YControl); var face = state.Get(MethodOffset.FaceState); UpdateFrontFace(yControl, face.FrontFace); bool flipY = yControl.HasFlag(YControl.NegateY); Span viewports = stackalloc Viewport[Constants.TotalViewports]; for (int index = 0; index < Constants.TotalViewports; index++) { var transform = state.Get(MethodOffset.ViewportTransform, index); var extents = state.Get (MethodOffset.ViewportExtents, index); float scaleX = MathF.Abs(transform.ScaleX); float scaleY = transform.ScaleY; if (flipY) { scaleY = -scaleY; } if (!_context.Capabilities.SupportsViewportSwizzle && transform.UnpackSwizzleY() == ViewportSwizzle.NegativeY) { scaleY = -scaleY; } if (index == 0) { // Try to guess the depth mode being used on the high level API // based on current transform. // It is setup like so by said APIs: // If depth mode is ZeroToOne: // TranslateZ = Near // ScaleZ = Far - Near // If depth mode is MinusOneToOne: // TranslateZ = (Near + Far) / 2 // ScaleZ = (Far - Near) / 2 // DepthNear/Far are sorted such as that Near is always less than Far. DepthMode depthMode = extents.DepthNear != transform.TranslateZ && extents.DepthFar != transform.TranslateZ ? DepthMode.MinusOneToOne : DepthMode.ZeroToOne; _context.Renderer.Pipeline.SetDepthMode(depthMode); } float x = transform.TranslateX - scaleX; float y = transform.TranslateY - scaleY; float width = scaleX * 2; float height = scaleY * 2; float scale = TextureManager.RenderTargetScale; if (scale != 1f) { x *= scale; y *= scale; width *= scale; height *= scale; } RectangleF region = new RectangleF(x, y, width, height); ViewportSwizzle swizzleX = transform.UnpackSwizzleX(); ViewportSwizzle swizzleY = transform.UnpackSwizzleY(); ViewportSwizzle swizzleZ = transform.UnpackSwizzleZ(); ViewportSwizzle swizzleW = transform.UnpackSwizzleW(); float depthNear = extents.DepthNear; float depthFar = extents.DepthFar; if (transform.ScaleZ < 0) { float temp = depthNear; depthNear = depthFar; depthFar = temp; } viewports[index] = new Viewport(region, swizzleX, swizzleY, swizzleZ, swizzleW, depthNear, depthFar); } _context.Renderer.Pipeline.SetViewports(0, viewports); } /// /// Updates host depth bias (also called polygon offset) state based on current GPU state. /// /// Current GPU state private void UpdateDepthBiasState(GpuState state) { var depthBias = state.Get(MethodOffset.DepthBiasState); float factor = state.Get(MethodOffset.DepthBiasFactor); float units = state.Get(MethodOffset.DepthBiasUnits); float clamp = state.Get(MethodOffset.DepthBiasClamp); PolygonModeMask enables; enables = (depthBias.PointEnable ? PolygonModeMask.Point : 0); enables |= (depthBias.LineEnable ? PolygonModeMask.Line : 0); enables |= (depthBias.FillEnable ? PolygonModeMask.Fill : 0); _context.Renderer.Pipeline.SetDepthBias(enables, factor, units / 2f, clamp); } /// /// Updates host stencil test state based on current GPU state. /// /// Current GPU state private void UpdateStencilTestState(GpuState state) { var backMasks = state.Get(MethodOffset.StencilBackMasks); var test = state.Get(MethodOffset.StencilTestState); var backTest = state.Get(MethodOffset.StencilBackTestState); CompareOp backFunc; StencilOp backSFail; StencilOp backDpPass; StencilOp backDpFail; int backFuncRef; int backFuncMask; int backMask; if (backTest.TwoSided) { backFunc = backTest.BackFunc; backSFail = backTest.BackSFail; backDpPass = backTest.BackDpPass; backDpFail = backTest.BackDpFail; backFuncRef = backMasks.FuncRef; backFuncMask = backMasks.FuncMask; backMask = backMasks.Mask; } else { backFunc = test.FrontFunc; backSFail = test.FrontSFail; backDpPass = test.FrontDpPass; backDpFail = test.FrontDpFail; backFuncRef = test.FrontFuncRef; backFuncMask = test.FrontFuncMask; backMask = test.FrontMask; } _context.Renderer.Pipeline.SetStencilTest(new StencilTestDescriptor( test.Enable, test.FrontFunc, test.FrontSFail, test.FrontDpPass, test.FrontDpFail, test.FrontFuncRef, test.FrontFuncMask, test.FrontMask, backFunc, backSFail, backDpPass, backDpFail, backFuncRef, backFuncMask, backMask)); } /// /// Updates current sampler pool address and size based on guest GPU state. /// /// Current GPU state private void UpdateSamplerPoolState(GpuState state) { var texturePool = state.Get(MethodOffset.TexturePoolState); var samplerPool = state.Get(MethodOffset.SamplerPoolState); var samplerIndex = state.Get(MethodOffset.SamplerIndex); int maximumId = samplerIndex == SamplerIndex.ViaHeaderIndex ? texturePool.MaximumId : samplerPool.MaximumId; TextureManager.SetGraphicsSamplerPool(samplerPool.Address.Pack(), maximumId, samplerIndex); } /// /// Updates current texture pool address and size based on guest GPU state. /// /// Current GPU state private void UpdateTexturePoolState(GpuState state) { var texturePool = state.Get(MethodOffset.TexturePoolState); TextureManager.SetGraphicsTexturePool(texturePool.Address.Pack(), texturePool.MaximumId); TextureManager.SetGraphicsTextureBufferIndex(state.Get(MethodOffset.TextureBufferIndex)); } /// /// Updates host vertex attributes based on guest GPU state. /// /// Current GPU state private void UpdateVertexAttribState(GpuState state) { Span vertexAttribs = stackalloc VertexAttribDescriptor[Constants.TotalVertexAttribs]; for (int index = 0; index < Constants.TotalVertexAttribs; index++) { var vertexAttrib = state.Get(MethodOffset.VertexAttribState, index); if (!FormatTable.TryGetAttribFormat(vertexAttrib.UnpackFormat(), out Format format)) { Logger.Debug?.Print(LogClass.Gpu, $"Invalid attribute format 0x{vertexAttrib.UnpackFormat():X}."); format = Format.R32G32B32A32Float; } vertexAttribs[index] = new VertexAttribDescriptor( vertexAttrib.UnpackBufferIndex(), vertexAttrib.UnpackOffset(), vertexAttrib.UnpackIsConstant(), format); } _context.Renderer.Pipeline.SetVertexAttribs(vertexAttribs); } /// /// Updates host point size based on guest GPU state. /// /// Current GPU state private void UpdatePointState(GpuState state) { float size = state.Get(MethodOffset.PointSize); bool isProgramPointSize = state.Get(MethodOffset.VertexProgramPointSize); bool enablePointSprite = state.Get(MethodOffset.PointSpriteEnable); // TODO: Need to figure out a way to map PointCoordReplace enable bit. Origin origin = (state.Get(MethodOffset.PointCoordReplace) & 4) == 0 ? Origin.LowerLeft : Origin.UpperLeft; _context.Renderer.Pipeline.SetPointParameters(size, isProgramPointSize, enablePointSprite, origin); } /// /// Updates host primitive restart based on guest GPU state. /// /// Current GPU state private void UpdatePrimitiveRestartState(GpuState state) { PrimitiveRestartState primitiveRestart = state.Get(MethodOffset.PrimitiveRestartState); _context.Renderer.Pipeline.SetPrimitiveRestart( primitiveRestart.Enable, primitiveRestart.Index); } /// /// Updates host index buffer binding based on guest GPU state. /// /// Current GPU state /// Index of the first index buffer element used on the draw /// Number of index buffer elements used on the draw private void UpdateIndexBufferState(GpuState state, int firstIndex, int indexCount) { var indexBuffer = state.Get(MethodOffset.IndexBufferState); if (indexCount == 0) { return; } ulong gpuVa = indexBuffer.Address.Pack(); // Do not use the end address to calculate the size, because // the result may be much larger than the real size of the index buffer. ulong size = (ulong)(firstIndex + indexCount); switch (indexBuffer.Type) { case IndexType.UShort: size *= 2; break; case IndexType.UInt: size *= 4; break; } BufferManager.SetIndexBuffer(gpuVa, size, indexBuffer.Type); // The index buffer affects the vertex buffer size calculation, we // need to ensure that they are updated. UpdateVertexBufferState(state); } /// /// Updates host vertex buffer bindings based on guest GPU state. /// /// Current GPU state private void UpdateVertexBufferState(GpuState state) { _isAnyVbInstanced = false; for (int index = 0; index < Constants.TotalVertexBuffers; index++) { var vertexBuffer = state.Get(MethodOffset.VertexBufferState, index); if (!vertexBuffer.UnpackEnable()) { BufferManager.SetVertexBuffer(index, 0, 0, 0, 0); continue; } GpuVa endAddress = state.Get(MethodOffset.VertexBufferEndAddress, index); ulong address = vertexBuffer.Address.Pack(); int stride = vertexBuffer.UnpackStride(); bool instanced = state.Get(MethodOffset.VertexBufferInstanced + index); int divisor = instanced ? vertexBuffer.Divisor : 0; _isAnyVbInstanced |= divisor != 0; ulong size; if (_ibStreamer.HasInlineIndexData || _drawIndexed || stride == 0 || instanced) { // This size may be (much) larger than the real vertex buffer size. // Avoid calculating it this way, unless we don't have any other option. size = endAddress.Pack() - address + 1; } else { // For non-indexed draws, we can guess the size from the vertex count // and stride. int firstInstance = state.Get(MethodOffset.FirstInstance); var drawState = state.Get(MethodOffset.VertexBufferDrawState); size = (ulong)((firstInstance + drawState.First + drawState.Count) * stride); } BufferManager.SetVertexBuffer(index, address, size, stride, divisor); } } /// /// Updates host face culling and orientation based on guest GPU state. /// /// Current GPU state private void UpdateFaceState(GpuState state) { var yControl = state.Get (MethodOffset.YControl); var face = state.Get(MethodOffset.FaceState); _context.Renderer.Pipeline.SetFaceCulling(face.CullEnable, face.CullFace); UpdateFrontFace(yControl, face.FrontFace); } /// /// Updates the front face based on the current front face and the origin. /// /// Y control register value, where the origin is located /// Front face private void UpdateFrontFace(YControl yControl, FrontFace frontFace) { bool isUpperLeftOrigin = !yControl.HasFlag(YControl.TriangleRastFlip); if (isUpperLeftOrigin) { frontFace = frontFace == FrontFace.CounterClockwise ? FrontFace.Clockwise : FrontFace.CounterClockwise; } _context.Renderer.Pipeline.SetFrontFace(frontFace); } /// /// Updates host render target color masks, based on guest GPU state. /// This defines which color channels are written to each color buffer. /// /// Current GPU state private void UpdateRtColorMask(GpuState state) { bool rtColorMaskShared = state.Get(MethodOffset.RtColorMaskShared); Span componentMasks = stackalloc uint[Constants.TotalRenderTargets]; for (int index = 0; index < Constants.TotalRenderTargets; index++) { var colorMask = state.Get(MethodOffset.RtColorMask, rtColorMaskShared ? 0 : index); uint componentMask; componentMask = (colorMask.UnpackRed() ? 1u : 0u); componentMask |= (colorMask.UnpackGreen() ? 2u : 0u); componentMask |= (colorMask.UnpackBlue() ? 4u : 0u); componentMask |= (colorMask.UnpackAlpha() ? 8u : 0u); componentMasks[index] = componentMask; } _context.Renderer.Pipeline.SetRenderTargetColorMasks(componentMasks); } /// /// Updates host render target color buffer blending state, based on guest state. /// /// Current GPU state private void UpdateBlendState(GpuState state) { bool blendIndependent = state.Get(MethodOffset.BlendIndependent); ColorF blendConstant = state.Get(MethodOffset.BlendConstant); for (int index = 0; index < Constants.TotalRenderTargets; index++) { BlendDescriptor descriptor; if (blendIndependent) { bool enable = state.Get (MethodOffset.BlendEnable, index); var blend = state.Get(MethodOffset.BlendState, index); descriptor = new BlendDescriptor( enable, blendConstant, blend.ColorOp, blend.ColorSrcFactor, blend.ColorDstFactor, blend.AlphaOp, blend.AlphaSrcFactor, blend.AlphaDstFactor); } else { bool enable = state.Get (MethodOffset.BlendEnable, 0); var blend = state.Get(MethodOffset.BlendStateCommon); descriptor = new BlendDescriptor( enable, blendConstant, blend.ColorOp, blend.ColorSrcFactor, blend.ColorDstFactor, blend.AlphaOp, blend.AlphaSrcFactor, blend.AlphaDstFactor); } _context.Renderer.Pipeline.SetBlendState(index, descriptor); } } /// /// Updates host logical operation state, based on guest state. /// /// Current GPU state public void UpdateLogicOpState(GpuState state) { LogicalOpState logicOpState = state.Get(MethodOffset.LogicOpState); _context.Renderer.Pipeline.SetLogicOpState(logicOpState.Enable, logicOpState.LogicalOp); } /// /// Storage buffer address and size information. /// private struct SbDescriptor { #pragma warning disable CS0649 public uint AddressLow; public uint AddressHigh; public int Size; public int Padding; #pragma warning restore CS0649 public ulong PackAddress() { return AddressLow | ((ulong)AddressHigh << 32); } } /// /// Updates host shaders based on the guest GPU state. /// /// Current GPU state private void UpdateShaderState(GpuState state) { ShaderAddresses addresses = new ShaderAddresses(); Span addressesSpan = MemoryMarshal.CreateSpan(ref addresses, 1); Span addressesArray = MemoryMarshal.Cast(addressesSpan); ulong baseAddress = state.Get(MethodOffset.ShaderBaseAddress).Pack(); for (int index = 0; index < 6; index++) { var shader = state.Get(MethodOffset.ShaderState, index); if (!shader.UnpackEnable() && index != 1) { continue; } addressesArray[index] = baseAddress + shader.Offset; } ShaderBundle gs = ShaderCache.GetGraphicsShader(state, addresses); byte oldVsClipDistancesWritten = _vsClipDistancesWritten; _vsUsesInstanceId = gs.Shaders[0]?.Info.UsesInstanceId ?? false; _vsClipDistancesWritten = gs.Shaders[0]?.Info.ClipDistancesWritten ?? 0; if (oldVsClipDistancesWritten != _vsClipDistancesWritten) { UpdateUserClipState(state); } int storageBufferBindingsCount = 0; int uniformBufferBindingsCount = 0; for (int stage = 0; stage < Constants.ShaderStages; stage++) { ShaderProgramInfo info = gs.Shaders[stage]?.Info; _currentProgramInfo[stage] = info; if (info == null) { TextureManager.SetGraphicsTextures(stage, Array.Empty()); TextureManager.SetGraphicsImages(stage, Array.Empty()); BufferManager.SetGraphicsStorageBufferBindings(stage, null); BufferManager.SetGraphicsUniformBufferBindings(stage, null); continue; } var textureBindings = new TextureBindingInfo[info.Textures.Count]; for (int index = 0; index < info.Textures.Count; index++) { var descriptor = info.Textures[index]; Target target = ShaderTexture.GetTarget(descriptor.Type); textureBindings[index] = new TextureBindingInfo( target, descriptor.Binding, descriptor.CbufSlot, descriptor.HandleIndex, descriptor.Flags); } TextureManager.SetGraphicsTextures(stage, textureBindings); var imageBindings = new TextureBindingInfo[info.Images.Count]; for (int index = 0; index < info.Images.Count; index++) { var descriptor = info.Images[index]; Target target = ShaderTexture.GetTarget(descriptor.Type); Format format = ShaderTexture.GetFormat(descriptor.Format); imageBindings[index] = new TextureBindingInfo( target, format, descriptor.Binding, descriptor.CbufSlot, descriptor.HandleIndex, descriptor.Flags); } TextureManager.SetGraphicsImages(stage, imageBindings); BufferManager.SetGraphicsStorageBufferBindings(stage, info.SBuffers); BufferManager.SetGraphicsUniformBufferBindings(stage, info.CBuffers); if (info.SBuffers.Count != 0) { storageBufferBindingsCount = Math.Max(storageBufferBindingsCount, info.SBuffers.Max(x => x.Binding) + 1); } if (info.CBuffers.Count != 0) { uniformBufferBindingsCount = Math.Max(uniformBufferBindingsCount, info.CBuffers.Max(x => x.Binding) + 1); } } BufferManager.SetGraphicsStorageBufferBindingsCount(storageBufferBindingsCount); BufferManager.SetGraphicsUniformBufferBindingsCount(uniformBufferBindingsCount); _context.Renderer.Pipeline.SetProgram(gs.HostProgram); } /// /// Updates transform feedback buffer state based on the guest GPU state. /// /// Current GPU state private void UpdateTfBufferState(GpuState state) { for (int index = 0; index < Constants.TotalTransformFeedbackBuffers; index++) { TfBufferState tfb = state.Get(MethodOffset.TfBufferState, index); if (!tfb.Enable) { BufferManager.SetTransformFeedbackBuffer(index, 0, 0); continue; } BufferManager.SetTransformFeedbackBuffer(index, tfb.Address.Pack(), (uint)tfb.Size); } } /// /// Updates user-defined clipping based on the guest GPU state. /// /// Current GPU state private void UpdateUserClipState(GpuState state) { int clipMask = state.Get(MethodOffset.ClipDistanceEnable) & _vsClipDistancesWritten; for (int i = 0; i < Constants.TotalClipDistances; ++i) { _context.Renderer.Pipeline.SetUserClipDistance(i, (clipMask & (1 << i)) != 0); } } /// /// Issues a texture barrier. /// This waits until previous texture writes from the GPU to finish, before /// performing new operations with said textures. /// /// Current GPU state (unused) /// Method call argument (unused) private void TextureBarrier(GpuState state, int argument) { _context.Renderer.Pipeline.TextureBarrier(); } /// /// Issues a texture barrier. /// This waits until previous texture writes from the GPU to finish, before /// performing new operations with said textures. /// This performs a per-tile wait, it is only valid if both the previous write /// and current access has the same access patterns. /// This may be faster than the regular barrier on tile-based rasterizers. /// /// Current GPU state (unused) /// Method call argument (unused) private void TextureBarrierTiled(GpuState state, int argument) { _context.Renderer.Pipeline.TextureBarrierTiled(); } } }