 f1d1670b0b
			
		
	
	
		f1d1670b0b
		
			
		
	
	
	
	
		
			
			* Implement HLE macro for DrawElementsIndirect * Shader cache version bump * Use GL_ARB_shader_draw_parameters extension on OpenGL * Fix DrawIndexedIndirectCount on Vulkan when extension is not supported * Implement DrawIndex * Alignment * Fix some validation errors * Rename BaseIds to DrawParameters * Fix incorrect index buffer and vertex buffer size in some cases * Add HLE macros for DrawArraysInstanced and DrawElementsInstanced * Perform a regular draw when indirect data is not modified * Use non-indirect draw methods if indirect buffer was not GPU modified * Only check if draw parameters match if the shader actually uses them * Expose Macro HLE setting on GUI * Reset FirstVertex and FirstInstance after draw * Update shader cache version again since some people already tested this * PR feedback Co-authored-by: riperiperi <rhy3756547@hotmail.com>
		
			
				
	
	
		
			851 lines
		
	
	
	
		
			32 KiB
		
	
	
	
		
			C#
		
	
	
	
	
	
			
		
		
	
	
			851 lines
		
	
	
	
		
			32 KiB
		
	
	
	
		
			C#
		
	
	
	
	
	
| using Ryujinx.Graphics.GAL;
 | |
| using Ryujinx.Graphics.Shader;
 | |
| using Ryujinx.Graphics.Shader.Translation;
 | |
| using Ryujinx.Graphics.Vulkan.Shaders;
 | |
| using Silk.NET.Vulkan;
 | |
| using System;
 | |
| using System.Collections.Generic;
 | |
| using VkFormat = Silk.NET.Vulkan.Format;
 | |
| 
 | |
| namespace Ryujinx.Graphics.Vulkan
 | |
| {
 | |
|     class HelperShader : IDisposable
 | |
|     {
 | |
|         private const int UniformBufferAlignment = 256;
 | |
| 
 | |
|         private readonly PipelineHelperShader _pipeline;
 | |
|         private readonly ISampler _samplerLinear;
 | |
|         private readonly ISampler _samplerNearest;
 | |
|         private readonly IProgram _programColorBlit;
 | |
|         private readonly IProgram _programColorBlitClearAlpha;
 | |
|         private readonly IProgram _programColorClear;
 | |
|         private readonly IProgram _programStrideChange;
 | |
|         private readonly IProgram _programColorCopyBetweenMsNonMs;
 | |
|         private readonly IProgram _programConvertIndexBuffer;
 | |
|         private readonly IProgram _programConvertIndirectData;
 | |
| 
 | |
|         public HelperShader(VulkanRenderer gd, Device device)
 | |
|         {
 | |
|             _pipeline = new PipelineHelperShader(gd, device);
 | |
|             _pipeline.Initialize();
 | |
| 
 | |
|             _samplerLinear = gd.CreateSampler(GAL.SamplerCreateInfo.Create(MinFilter.Linear, MagFilter.Linear));
 | |
|             _samplerNearest = gd.CreateSampler(GAL.SamplerCreateInfo.Create(MinFilter.Nearest, MagFilter.Nearest));
 | |
| 
 | |
|             var vertexBindings = new ShaderBindings(
 | |
|                 new[] { 1 },
 | |
|                 Array.Empty<int>(),
 | |
|                 Array.Empty<int>(),
 | |
|                 Array.Empty<int>());
 | |
| 
 | |
|             var fragmentBindings = new ShaderBindings(
 | |
|                 Array.Empty<int>(),
 | |
|                 Array.Empty<int>(),
 | |
|                 new[] { 0 },
 | |
|                 Array.Empty<int>());
 | |
| 
 | |
|             _programColorBlit = gd.CreateProgramWithMinimalLayout(new[]
 | |
|             {
 | |
|                 new ShaderSource(ShaderBinaries.ColorBlitVertexShaderSource, vertexBindings, ShaderStage.Vertex, TargetLanguage.Spirv),
 | |
|                 new ShaderSource(ShaderBinaries.ColorBlitFragmentShaderSource, fragmentBindings, ShaderStage.Fragment, TargetLanguage.Spirv),
 | |
|             });
 | |
| 
 | |
|             _programColorBlitClearAlpha = gd.CreateProgramWithMinimalLayout(new[]
 | |
|             {
 | |
|                 new ShaderSource(ShaderBinaries.ColorBlitVertexShaderSource, vertexBindings, ShaderStage.Vertex, TargetLanguage.Spirv),
 | |
|                 new ShaderSource(ShaderBinaries.ColorBlitClearAlphaFragmentShaderSource, fragmentBindings, ShaderStage.Fragment, TargetLanguage.Spirv),
 | |
|             });
 | |
| 
 | |
|             var fragmentBindings2 = new ShaderBindings(
 | |
|                 Array.Empty<int>(),
 | |
|                 Array.Empty<int>(),
 | |
|                 Array.Empty<int>(),
 | |
|                 Array.Empty<int>());
 | |
| 
 | |
|             _programColorClear = gd.CreateProgramWithMinimalLayout(new[]
 | |
|             {
 | |
|                 new ShaderSource(ShaderBinaries.ColorClearVertexShaderSource, vertexBindings, ShaderStage.Vertex, TargetLanguage.Spirv),
 | |
|                 new ShaderSource(ShaderBinaries.ColorClearFragmentShaderSource, fragmentBindings2, ShaderStage.Fragment, TargetLanguage.Spirv),
 | |
|             });
 | |
| 
 | |
|             var strideChangeBindings = new ShaderBindings(
 | |
|                 new[] { 0 },
 | |
|                 new[] { 1, 2 },
 | |
|                 Array.Empty<int>(),
 | |
|                 Array.Empty<int>());
 | |
| 
 | |
|             _programStrideChange = gd.CreateProgramWithMinimalLayout(new[]
 | |
|             {
 | |
|                 new ShaderSource(ShaderBinaries.ChangeBufferStrideShaderSource, strideChangeBindings, ShaderStage.Compute, TargetLanguage.Spirv),
 | |
|             });
 | |
| 
 | |
|             var colorCopyMSBindings = new ShaderBindings(
 | |
|                 new[] { 0 },
 | |
|                 Array.Empty<int>(),
 | |
|                 new[] { 0 },
 | |
|                 new[] { 0 });
 | |
| 
 | |
|             _programColorCopyBetweenMsNonMs = gd.CreateProgramWithMinimalLayout(new[]
 | |
|             {
 | |
|                 new ShaderSource(ShaderBinaries.ColorCopyBetweenMsNonMs, colorCopyMSBindings, ShaderStage.Compute, TargetLanguage.Spirv),
 | |
|             }, new[]
 | |
|             {
 | |
|                 new SpecDescription((0, SpecConstType.Int32))
 | |
|             });
 | |
| 
 | |
|             var convertIndexBufferBindings = new ShaderBindings(
 | |
|                 new[] { 0 },
 | |
|                 new[] { 1, 2 },
 | |
|                 Array.Empty<int>(),
 | |
|                 Array.Empty<int>());
 | |
| 
 | |
|             _programConvertIndexBuffer = gd.CreateProgramWithMinimalLayout(new[]
 | |
|             {
 | |
|                 new ShaderSource(ShaderBinaries.ConvertIndexBufferShaderSource, convertIndexBufferBindings, ShaderStage.Compute, TargetLanguage.Spirv),
 | |
|             });
 | |
| 
 | |
|             var convertIndirectDataBindings = new ShaderBindings(
 | |
|                 new[] { 0 },
 | |
|                 new[] { 1, 2, 3 },
 | |
|                 Array.Empty<int>(),
 | |
|                 Array.Empty<int>());
 | |
| 
 | |
|             _programConvertIndirectData = gd.CreateProgramWithMinimalLayout(new[]
 | |
|             {
 | |
|                 new ShaderSource(ShaderBinaries.ConvertIndirectDataShaderSource, convertIndirectDataBindings, ShaderStage.Compute, TargetLanguage.Spirv),
 | |
|             });
 | |
|         }
 | |
| 
 | |
|         public void Blit(
 | |
|             VulkanRenderer gd,
 | |
|             TextureView src,
 | |
|             Auto<DisposableImageView> dst,
 | |
|             int dstWidth,
 | |
|             int dstHeight,
 | |
|             VkFormat dstFormat,
 | |
|             Extents2D srcRegion,
 | |
|             Extents2D dstRegion,
 | |
|             bool linearFilter,
 | |
|             bool clearAlpha = false)
 | |
|         {
 | |
|             gd.FlushAllCommands();
 | |
| 
 | |
|             using var cbs = gd.CommandBufferPool.Rent();
 | |
| 
 | |
|             Blit(gd, cbs, src, dst, dstWidth, dstHeight, dstFormat, srcRegion, dstRegion, linearFilter, clearAlpha);
 | |
|         }
 | |
| 
 | |
|         public void Blit(
 | |
|             VulkanRenderer gd,
 | |
|             CommandBufferScoped cbs,
 | |
|             TextureView src,
 | |
|             Auto<DisposableImageView> dst,
 | |
|             int dstWidth,
 | |
|             int dstHeight,
 | |
|             VkFormat dstFormat,
 | |
|             Extents2D srcRegion,
 | |
|             Extents2D dstRegion,
 | |
|             bool linearFilter,
 | |
|             bool clearAlpha = false)
 | |
|         {
 | |
|             _pipeline.SetCommandBuffer(cbs);
 | |
| 
 | |
|             const int RegionBufferSize = 16;
 | |
| 
 | |
|             var sampler = linearFilter ? _samplerLinear : _samplerNearest;
 | |
| 
 | |
|             _pipeline.SetTextureAndSampler(ShaderStage.Fragment, 0, src, sampler);
 | |
| 
 | |
|             Span<float> region = stackalloc float[RegionBufferSize / sizeof(float)];
 | |
| 
 | |
|             region[0] = (float)srcRegion.X1 / src.Width;
 | |
|             region[1] = (float)srcRegion.X2 / src.Width;
 | |
|             region[2] = (float)srcRegion.Y1 / src.Height;
 | |
|             region[3] = (float)srcRegion.Y2 / src.Height;
 | |
| 
 | |
|             if (dstRegion.X1 > dstRegion.X2)
 | |
|             {
 | |
|                 (region[0], region[1]) = (region[1], region[0]);
 | |
|             }
 | |
| 
 | |
|             if (dstRegion.Y1 > dstRegion.Y2)
 | |
|             {
 | |
|                 (region[2], region[3]) = (region[3], region[2]);
 | |
|             }
 | |
| 
 | |
|             var bufferHandle = gd.BufferManager.CreateWithHandle(gd, RegionBufferSize, false);
 | |
| 
 | |
|             gd.BufferManager.SetData<float>(bufferHandle, 0, region);
 | |
| 
 | |
|             _pipeline.SetUniformBuffers(1, stackalloc[] { new BufferRange(bufferHandle, 0, RegionBufferSize) });
 | |
| 
 | |
|             Span<GAL.Viewport> viewports = stackalloc GAL.Viewport[1];
 | |
| 
 | |
|             var rect = new Rectangle<float>(
 | |
|                 MathF.Min(dstRegion.X1, dstRegion.X2),
 | |
|                 MathF.Min(dstRegion.Y1, dstRegion.Y2),
 | |
|                 MathF.Abs(dstRegion.X2 - dstRegion.X1),
 | |
|                 MathF.Abs(dstRegion.Y2 - dstRegion.Y1));
 | |
| 
 | |
|             viewports[0] = new GAL.Viewport(
 | |
|                 rect,
 | |
|                 ViewportSwizzle.PositiveX,
 | |
|                 ViewportSwizzle.PositiveY,
 | |
|                 ViewportSwizzle.PositiveZ,
 | |
|                 ViewportSwizzle.PositiveW,
 | |
|                 0f,
 | |
|                 1f);
 | |
| 
 | |
|             Span<Rectangle<int>> scissors = stackalloc Rectangle<int>[1];
 | |
| 
 | |
|             scissors[0] = new Rectangle<int>(0, 0, dstWidth, dstHeight);
 | |
| 
 | |
|             _pipeline.SetProgram(clearAlpha ? _programColorBlitClearAlpha : _programColorBlit);
 | |
|             _pipeline.SetRenderTarget(dst, (uint)dstWidth, (uint)dstHeight, false, dstFormat);
 | |
|             _pipeline.SetRenderTargetColorMasks(new uint[] { 0xf });
 | |
|             _pipeline.SetScissors(scissors);
 | |
| 
 | |
|             if (clearAlpha)
 | |
|             {
 | |
|                 _pipeline.ClearRenderTargetColor(0, 0, 1, new ColorF(0f, 0f, 0f, 1f));
 | |
|             }
 | |
| 
 | |
|             _pipeline.SetViewports(viewports, false);
 | |
|             _pipeline.SetPrimitiveTopology(GAL.PrimitiveTopology.TriangleStrip);
 | |
|             _pipeline.Draw(4, 1, 0, 0);
 | |
|             _pipeline.Finish(gd, cbs);
 | |
| 
 | |
|             gd.BufferManager.Delete(bufferHandle);
 | |
|         }
 | |
| 
 | |
|         public void Clear(
 | |
|             VulkanRenderer gd,
 | |
|             Auto<DisposableImageView> dst,
 | |
|             ReadOnlySpan<float> clearColor,
 | |
|             uint componentMask,
 | |
|             int dstWidth,
 | |
|             int dstHeight,
 | |
|             VkFormat dstFormat,
 | |
|             Rectangle<int> scissor)
 | |
|         {
 | |
|             const int ClearColorBufferSize = 16;
 | |
| 
 | |
|             gd.FlushAllCommands();
 | |
| 
 | |
|             using var cbs = gd.CommandBufferPool.Rent();
 | |
| 
 | |
|             _pipeline.SetCommandBuffer(cbs);
 | |
| 
 | |
|             var bufferHandle = gd.BufferManager.CreateWithHandle(gd, ClearColorBufferSize, false);
 | |
| 
 | |
|             gd.BufferManager.SetData<float>(bufferHandle, 0, clearColor);
 | |
| 
 | |
|             _pipeline.SetUniformBuffers(1, stackalloc[] { new BufferRange(bufferHandle, 0, ClearColorBufferSize) });
 | |
| 
 | |
|             Span<GAL.Viewport> viewports = stackalloc GAL.Viewport[1];
 | |
| 
 | |
|             viewports[0] = new GAL.Viewport(
 | |
|                 new Rectangle<float>(0, 0, dstWidth, dstHeight),
 | |
|                 ViewportSwizzle.PositiveX,
 | |
|                 ViewportSwizzle.PositiveY,
 | |
|                 ViewportSwizzle.PositiveZ,
 | |
|                 ViewportSwizzle.PositiveW,
 | |
|                 0f,
 | |
|                 1f);
 | |
| 
 | |
|             Span<Rectangle<int>> scissors = stackalloc Rectangle<int>[1];
 | |
| 
 | |
|             scissors[0] = scissor;
 | |
| 
 | |
|             _pipeline.SetProgram(_programColorClear);
 | |
|             _pipeline.SetRenderTarget(dst, (uint)dstWidth, (uint)dstHeight, false, dstFormat);
 | |
|             _pipeline.SetRenderTargetColorMasks(new uint[] { componentMask });
 | |
|             _pipeline.SetViewports(viewports, false);
 | |
|             _pipeline.SetScissors(scissors);
 | |
|             _pipeline.SetPrimitiveTopology(GAL.PrimitiveTopology.TriangleStrip);
 | |
|             _pipeline.Draw(4, 1, 0, 0);
 | |
|             _pipeline.Finish();
 | |
| 
 | |
|             gd.BufferManager.Delete(bufferHandle);
 | |
|         }
 | |
| 
 | |
|         public void DrawTexture(
 | |
|             VulkanRenderer gd,
 | |
|             PipelineBase pipeline,
 | |
|             TextureView src,
 | |
|             ISampler srcSampler,
 | |
|             Extents2DF srcRegion,
 | |
|             Extents2DF dstRegion)
 | |
|         {
 | |
|             const int RegionBufferSize = 16;
 | |
| 
 | |
|             pipeline.SetTextureAndSampler(ShaderStage.Fragment, 0, src, srcSampler);
 | |
| 
 | |
|             Span<float> region = stackalloc float[RegionBufferSize / sizeof(float)];
 | |
| 
 | |
|             region[0] = srcRegion.X1 / src.Width;
 | |
|             region[1] = srcRegion.X2 / src.Width;
 | |
|             region[2] = srcRegion.Y1 / src.Height;
 | |
|             region[3] = srcRegion.Y2 / src.Height;
 | |
| 
 | |
|             if (dstRegion.X1 > dstRegion.X2)
 | |
|             {
 | |
|                 (region[0], region[1]) = (region[1], region[0]);
 | |
|             }
 | |
| 
 | |
|             if (dstRegion.Y1 > dstRegion.Y2)
 | |
|             {
 | |
|                 (region[2], region[3]) = (region[3], region[2]);
 | |
|             }
 | |
| 
 | |
|             var bufferHandle = gd.BufferManager.CreateWithHandle(gd, RegionBufferSize, false);
 | |
| 
 | |
|             gd.BufferManager.SetData<float>(bufferHandle, 0, region);
 | |
| 
 | |
|             pipeline.SetUniformBuffers(1, stackalloc[] { new BufferRange(bufferHandle, 0, RegionBufferSize) });
 | |
| 
 | |
|             Span<GAL.Viewport> viewports = stackalloc GAL.Viewport[1];
 | |
| 
 | |
|             var rect = new Rectangle<float>(
 | |
|                 MathF.Min(dstRegion.X1, dstRegion.X2),
 | |
|                 MathF.Min(dstRegion.Y1, dstRegion.Y2),
 | |
|                 MathF.Abs(dstRegion.X2 - dstRegion.X1),
 | |
|                 MathF.Abs(dstRegion.Y2 - dstRegion.Y1));
 | |
| 
 | |
|             viewports[0] = new GAL.Viewport(
 | |
|                 rect,
 | |
|                 ViewportSwizzle.PositiveX,
 | |
|                 ViewportSwizzle.PositiveY,
 | |
|                 ViewportSwizzle.PositiveZ,
 | |
|                 ViewportSwizzle.PositiveW,
 | |
|                 0f,
 | |
|                 1f);
 | |
| 
 | |
|             Span<Rectangle<int>> scissors = stackalloc Rectangle<int>[1];
 | |
| 
 | |
|             pipeline.SetProgram(_programColorBlit);
 | |
|             pipeline.SetViewports(viewports, false);
 | |
|             pipeline.SetPrimitiveTopology(GAL.PrimitiveTopology.TriangleStrip);
 | |
|             pipeline.Draw(4, 1, 0, 0);
 | |
| 
 | |
|             gd.BufferManager.Delete(bufferHandle);
 | |
|         }
 | |
| 
 | |
|         public unsafe void ConvertI8ToI16(VulkanRenderer gd, CommandBufferScoped cbs, BufferHolder src, BufferHolder dst, int srcOffset, int size)
 | |
|         {
 | |
|             ChangeStride(gd, cbs, src, dst, srcOffset, size, 1, 2);
 | |
|         }
 | |
| 
 | |
|         public unsafe void ChangeStride(VulkanRenderer gd, CommandBufferScoped cbs, BufferHolder src, BufferHolder dst, int srcOffset, int size, int stride, int newStride)
 | |
|         {
 | |
|             bool supportsUint8 = gd.Capabilities.SupportsShaderInt8;
 | |
| 
 | |
|             int elems = size / stride;
 | |
|             int newSize = elems * newStride;
 | |
| 
 | |
|             var srcBufferAuto = src.GetBuffer();
 | |
|             var dstBufferAuto = dst.GetBuffer();
 | |
| 
 | |
|             var srcBuffer = srcBufferAuto.Get(cbs, srcOffset, size).Value;
 | |
|             var dstBuffer = dstBufferAuto.Get(cbs, 0, newSize).Value;
 | |
| 
 | |
|             var access = supportsUint8 ? AccessFlags.AccessShaderWriteBit : AccessFlags.AccessTransferWriteBit;
 | |
|             var stage = supportsUint8 ? PipelineStageFlags.PipelineStageComputeShaderBit : PipelineStageFlags.PipelineStageTransferBit;
 | |
| 
 | |
|             BufferHolder.InsertBufferBarrier(
 | |
|                 gd,
 | |
|                 cbs.CommandBuffer,
 | |
|                 dstBuffer,
 | |
|                 BufferHolder.DefaultAccessFlags,
 | |
|                 access,
 | |
|                 PipelineStageFlags.PipelineStageAllCommandsBit,
 | |
|                 stage,
 | |
|                 0,
 | |
|                 newSize);
 | |
| 
 | |
|             if (supportsUint8)
 | |
|             {
 | |
|                 const int ParamsBufferSize = 16;
 | |
| 
 | |
|                 Span<int> shaderParams = stackalloc int[ParamsBufferSize / sizeof(int)];
 | |
| 
 | |
|                 shaderParams[0] = stride;
 | |
|                 shaderParams[1] = newStride;
 | |
|                 shaderParams[2] = size;
 | |
|                 shaderParams[3] = srcOffset;
 | |
| 
 | |
|                 var bufferHandle = gd.BufferManager.CreateWithHandle(gd, ParamsBufferSize, false);
 | |
| 
 | |
|                 gd.BufferManager.SetData<int>(bufferHandle, 0, shaderParams);
 | |
| 
 | |
|                 _pipeline.SetCommandBuffer(cbs);
 | |
| 
 | |
|                 _pipeline.SetUniformBuffers(0, stackalloc[] { new BufferRange(bufferHandle, 0, ParamsBufferSize) });
 | |
| 
 | |
|                 Span<Auto<DisposableBuffer>> sbRanges = new Auto<DisposableBuffer>[2];
 | |
| 
 | |
|                 sbRanges[0] = srcBufferAuto;
 | |
|                 sbRanges[1] = dstBufferAuto;
 | |
| 
 | |
|                 _pipeline.SetStorageBuffers(1, sbRanges);
 | |
| 
 | |
|                 _pipeline.SetProgram(_programStrideChange);
 | |
|                 _pipeline.DispatchCompute(1, 1, 1);
 | |
| 
 | |
|                 gd.BufferManager.Delete(bufferHandle);
 | |
| 
 | |
|                 _pipeline.Finish(gd, cbs);
 | |
|             }
 | |
|             else
 | |
|             {
 | |
|                 gd.Api.CmdFillBuffer(cbs.CommandBuffer, dstBuffer, 0, Vk.WholeSize, 0);
 | |
| 
 | |
|                 var bufferCopy = new BufferCopy[elems];
 | |
| 
 | |
|                 for (ulong i = 0; i < (ulong)elems; i++)
 | |
|                 {
 | |
|                     bufferCopy[i] = new BufferCopy((ulong)srcOffset + i * (ulong)stride, i * (ulong)newStride, (ulong)stride);
 | |
|                 }
 | |
| 
 | |
|                 fixed (BufferCopy* pBufferCopy = bufferCopy)
 | |
|                 {
 | |
|                     gd.Api.CmdCopyBuffer(cbs.CommandBuffer, srcBuffer, dstBuffer, (uint)elems, pBufferCopy);
 | |
|                 }
 | |
|             }
 | |
| 
 | |
|             BufferHolder.InsertBufferBarrier(
 | |
|                 gd,
 | |
|                 cbs.CommandBuffer,
 | |
|                 dstBuffer,
 | |
|                 access,
 | |
|                 BufferHolder.DefaultAccessFlags,
 | |
|                 stage,
 | |
|                 PipelineStageFlags.PipelineStageAllCommandsBit,
 | |
|                 0,
 | |
|                 newSize);
 | |
|         }
 | |
| 
 | |
|         public unsafe void ConvertIndexBuffer(VulkanRenderer gd,
 | |
|             CommandBufferScoped cbs,
 | |
|             BufferHolder src,
 | |
|             BufferHolder dst,
 | |
|             IndexBufferPattern pattern,
 | |
|             int indexSize,
 | |
|             int srcOffset,
 | |
|             int indexCount)
 | |
|         {
 | |
|             // TODO: Support conversion with primitive restart enabled.
 | |
|             // TODO: Convert with a compute shader?
 | |
| 
 | |
|             int convertedCount = pattern.GetConvertedCount(indexCount);
 | |
|             int outputIndexSize = 4;
 | |
| 
 | |
|             var srcBuffer = src.GetBuffer().Get(cbs, srcOffset, indexCount * indexSize).Value;
 | |
|             var dstBuffer = dst.GetBuffer().Get(cbs, 0, convertedCount * outputIndexSize).Value;
 | |
| 
 | |
|             gd.Api.CmdFillBuffer(cbs.CommandBuffer, dstBuffer, 0, Vk.WholeSize, 0);
 | |
| 
 | |
|             var bufferCopy = new List<BufferCopy>();
 | |
|             int outputOffset = 0;
 | |
| 
 | |
|             // Try to merge copies of adjacent indices to reduce copy count.
 | |
|             int sequenceStart = 0;
 | |
|             int sequenceLength = 0;
 | |
| 
 | |
|             foreach (var index in pattern.GetIndexMapping(indexCount))
 | |
|             {
 | |
|                 if (sequenceLength > 0)
 | |
|                 {
 | |
|                     if (index == sequenceStart + sequenceLength && indexSize == outputIndexSize)
 | |
|                     {
 | |
|                         sequenceLength++;
 | |
|                         continue;
 | |
|                     }
 | |
| 
 | |
|                     // Commit the copy so far.
 | |
|                     bufferCopy.Add(new BufferCopy((ulong)(srcOffset + sequenceStart * indexSize), (ulong)outputOffset, (ulong)(indexSize * sequenceLength)));
 | |
|                     outputOffset += outputIndexSize * sequenceLength;
 | |
|                 }
 | |
| 
 | |
|                 sequenceStart = index;
 | |
|                 sequenceLength = 1;
 | |
|             }
 | |
| 
 | |
|             if (sequenceLength > 0)
 | |
|             {
 | |
|                 // Commit final pending copy.
 | |
|                 bufferCopy.Add(new BufferCopy((ulong)(srcOffset + sequenceStart * indexSize), (ulong)outputOffset, (ulong)(indexSize * sequenceLength)));
 | |
|             }
 | |
| 
 | |
|             var bufferCopyArray = bufferCopy.ToArray();
 | |
| 
 | |
|             BufferHolder.InsertBufferBarrier(
 | |
|                 gd,
 | |
|                 cbs.CommandBuffer,
 | |
|                 dstBuffer,
 | |
|                 BufferHolder.DefaultAccessFlags,
 | |
|                 AccessFlags.AccessTransferWriteBit,
 | |
|                 PipelineStageFlags.PipelineStageAllCommandsBit,
 | |
|                 PipelineStageFlags.PipelineStageTransferBit,
 | |
|                 0,
 | |
|                 convertedCount * outputIndexSize);
 | |
| 
 | |
|             fixed (BufferCopy* pBufferCopy = bufferCopyArray)
 | |
|             {
 | |
|                 gd.Api.CmdCopyBuffer(cbs.CommandBuffer, srcBuffer, dstBuffer, (uint)bufferCopyArray.Length, pBufferCopy);
 | |
|             }
 | |
| 
 | |
|             BufferHolder.InsertBufferBarrier(
 | |
|                 gd,
 | |
|                 cbs.CommandBuffer,
 | |
|                 dstBuffer,
 | |
|                 AccessFlags.AccessTransferWriteBit,
 | |
|                 BufferHolder.DefaultAccessFlags,
 | |
|                 PipelineStageFlags.PipelineStageTransferBit,
 | |
|                 PipelineStageFlags.PipelineStageAllCommandsBit,
 | |
|                 0,
 | |
|                 convertedCount * outputIndexSize);
 | |
|         }
 | |
| 
 | |
|         public void CopyMSToNonMS(VulkanRenderer gd, CommandBufferScoped cbs, TextureView src, TextureView dst, int srcLayer, int dstLayer, int depth)
 | |
|         {
 | |
|             CopyMS(gd, cbs, src, dst, srcLayer, dstLayer, depth, src.Info.Samples, dst.Info.Width, dst.Info.Height);
 | |
|         }
 | |
| 
 | |
|         public void CopyNonMSToMS(VulkanRenderer gd, CommandBufferScoped cbs, TextureView src, TextureView dst, int srcLayer, int dstLayer, int depth)
 | |
|         {
 | |
|             CopyMS(gd, cbs, src, dst, srcLayer, dstLayer, depth, dst.Info.Samples, src.Info.Width, src.Info.Height);
 | |
|         }
 | |
| 
 | |
|         private void CopyMS(
 | |
|             VulkanRenderer gd,
 | |
|             CommandBufferScoped cbs,
 | |
|             TextureView src,
 | |
|             TextureView dst,
 | |
|             int srcLayer,
 | |
|             int dstLayer,
 | |
|             int depth,
 | |
|             int samples,
 | |
|             int nonMSWidth,
 | |
|             int nonMSHeight)
 | |
|         {
 | |
|             const int ParamsBufferSize = 16;
 | |
| 
 | |
|             Span<int> shaderParams = stackalloc int[ParamsBufferSize / sizeof(int)];
 | |
| 
 | |
|             // X and Y are the expected texture samples.
 | |
|             // Z and W are the actual texture samples used.
 | |
|             // They may differ if the GPU does not support the samples count requested and we had to use a lower amount.
 | |
|             (shaderParams[0], shaderParams[1]) = GetSampleCountXYLog2(samples);
 | |
|             (shaderParams[2], shaderParams[3]) = GetSampleCountXYLog2((int)TextureStorage.ConvertToSampleCountFlags((uint)samples));
 | |
| 
 | |
|             var bufferHandle = gd.BufferManager.CreateWithHandle(gd, ParamsBufferSize, false);
 | |
| 
 | |
|             gd.BufferManager.SetData<int>(bufferHandle, 0, shaderParams);
 | |
| 
 | |
|             TextureView.InsertImageBarrier(
 | |
|                 gd.Api,
 | |
|                 cbs.CommandBuffer,
 | |
|                 src.GetImage().Get(cbs).Value,
 | |
|                 TextureStorage.DefaultAccessMask,
 | |
|                 AccessFlags.AccessShaderReadBit,
 | |
|                 PipelineStageFlags.PipelineStageAllCommandsBit,
 | |
|                 PipelineStageFlags.PipelineStageComputeShaderBit,
 | |
|                 ImageAspectFlags.ImageAspectColorBit,
 | |
|                 src.FirstLayer + srcLayer,
 | |
|                 src.FirstLevel,
 | |
|                 depth,
 | |
|                 1);
 | |
| 
 | |
|             _pipeline.SetCommandBuffer(cbs);
 | |
| 
 | |
|             _pipeline.SetProgram(_programColorCopyBetweenMsNonMs);
 | |
| 
 | |
|             var format = GetFormat(src.Info.BytesPerPixel);
 | |
| 
 | |
|             int dispatchX = (nonMSWidth + 31) / 32;
 | |
|             int dispatchY = (nonMSHeight + 31) / 32;
 | |
| 
 | |
|             // Specialize shader.
 | |
|             bool srcIsMs = src.Info.Target.IsMultisample();
 | |
|             int conversionType = srcIsMs ? src.Info.BytesPerPixel : -src.Info.BytesPerPixel;
 | |
|             _pipeline.Specialize(conversionType);
 | |
| 
 | |
|             _pipeline.SetUniformBuffers(0, stackalloc[] { new BufferRange(bufferHandle, 0, ParamsBufferSize) });
 | |
| 
 | |
|             if (src.Info.Target == Target.Texture2DMultisampleArray ||
 | |
|                 dst.Info.Target == Target.Texture2DMultisampleArray)
 | |
|             {
 | |
|                 for (int z = 0; z < depth; z++)
 | |
|                 {
 | |
|                     var srcView = Create2DLayerView(src, srcLayer + z, format);
 | |
|                     var dstView = Create2DLayerView(dst, dstLayer + z);
 | |
| 
 | |
|                     _pipeline.SetTextureAndSampler(ShaderStage.Compute, 0, srcView, null);
 | |
|                     _pipeline.SetImage(0, dstView, format);
 | |
| 
 | |
|                     _pipeline.DispatchCompute(dispatchX, dispatchY, 1);
 | |
| 
 | |
|                     srcView.Release();
 | |
|                     dstView.Release();
 | |
|                 }
 | |
|             }
 | |
|             else
 | |
|             {
 | |
|                 var srcView = Create2DLayerView(src, srcLayer, format);
 | |
| 
 | |
|                 _pipeline.SetTextureAndSampler(ShaderStage.Compute, 0, srcView, null);
 | |
|                 _pipeline.SetImage(0, dst, format);
 | |
| 
 | |
|                 _pipeline.DispatchCompute(dispatchX, dispatchY, 1);
 | |
| 
 | |
|                 srcView.Release();
 | |
|             }
 | |
| 
 | |
|             gd.BufferManager.Delete(bufferHandle);
 | |
| 
 | |
|             _pipeline.Finish(gd, cbs);
 | |
| 
 | |
|             TextureView.InsertImageBarrier(
 | |
|                 gd.Api,
 | |
|                 cbs.CommandBuffer,
 | |
|                 dst.GetImage().Get(cbs).Value,
 | |
|                 AccessFlags.AccessShaderWriteBit,
 | |
|                 TextureStorage.DefaultAccessMask,
 | |
|                 PipelineStageFlags.PipelineStageComputeShaderBit,
 | |
|                 PipelineStageFlags.PipelineStageAllCommandsBit,
 | |
|                 ImageAspectFlags.ImageAspectColorBit,
 | |
|                 dst.FirstLayer + dstLayer,
 | |
|                 dst.FirstLevel,
 | |
|                 depth,
 | |
|                 1);
 | |
|         }
 | |
| 
 | |
|         private static (int, int) GetSampleCountXYLog2(int samples)
 | |
|         {
 | |
|             int samplesInXLog2 = 0;
 | |
|             int samplesInYLog2 = 0;
 | |
| 
 | |
|             switch (samples)
 | |
|             {
 | |
|                 case 2: // 2x1
 | |
|                     samplesInXLog2 = 1;
 | |
|                     break;
 | |
|                 case 4: // 2x2
 | |
|                     samplesInXLog2 = 1;
 | |
|                     samplesInYLog2 = 1;
 | |
|                     break;
 | |
|                 case 8: // 4x2
 | |
|                     samplesInXLog2 = 2;
 | |
|                     samplesInYLog2 = 1;
 | |
|                     break;
 | |
|                 case 16: // 4x4
 | |
|                     samplesInXLog2 = 2;
 | |
|                     samplesInYLog2 = 2;
 | |
|                     break;
 | |
|                 case 32: // 8x4
 | |
|                     samplesInXLog2 = 3;
 | |
|                     samplesInYLog2 = 2;
 | |
|                     break;
 | |
|                 case 64: // 8x8
 | |
|                     samplesInXLog2 = 3;
 | |
|                     samplesInYLog2 = 3;
 | |
|                     break;
 | |
|             }
 | |
| 
 | |
|             return (samplesInXLog2, samplesInYLog2);
 | |
|         }
 | |
| 
 | |
|         private static ITexture Create2DLayerView(TextureView from, int layer, GAL.Format? format = null)
 | |
|         {
 | |
|             var target = from.Info.Target switch
 | |
|             {
 | |
|                 Target.Texture1DArray => Target.Texture1D,
 | |
|                 Target.Texture2DArray => Target.Texture2D,
 | |
|                 Target.Texture2DMultisampleArray => Target.Texture2DMultisample,
 | |
|                 _ => from.Info.Target
 | |
|             };
 | |
| 
 | |
|             var info = new TextureCreateInfo(
 | |
|                 from.Info.Width,
 | |
|                 from.Info.Height,
 | |
|                 from.Info.Depth,
 | |
|                 1,
 | |
|                 from.Info.Samples,
 | |
|                 from.Info.BlockWidth,
 | |
|                 from.Info.BlockHeight,
 | |
|                 from.Info.BytesPerPixel,
 | |
|                 format ?? from.Info.Format,
 | |
|                 from.Info.DepthStencilMode,
 | |
|                 target,
 | |
|                 from.Info.SwizzleR,
 | |
|                 from.Info.SwizzleG,
 | |
|                 from.Info.SwizzleB,
 | |
|                 from.Info.SwizzleA);
 | |
| 
 | |
|             return from.CreateView(info, layer, 0);
 | |
|         }
 | |
| 
 | |
|         private static GAL.Format GetFormat(int bytesPerPixel)
 | |
|         {
 | |
|             return bytesPerPixel switch
 | |
|             {
 | |
|                 1 => GAL.Format.R8Uint,
 | |
|                 2 => GAL.Format.R16Uint,
 | |
|                 4 => GAL.Format.R32Uint,
 | |
|                 8 => GAL.Format.R32G32Uint,
 | |
|                 16 => GAL.Format.R32G32B32A32Uint,
 | |
|                 _ => throw new ArgumentException($"Invalid bytes per pixel {bytesPerPixel}.")
 | |
|             };
 | |
|         }
 | |
| 
 | |
|         public void ConvertIndexBufferIndirect(
 | |
|             VulkanRenderer gd,
 | |
|             CommandBufferScoped cbs,
 | |
|             BufferHolder srcIndirectBuffer,
 | |
|             BufferHolder dstIndirectBuffer,
 | |
|             BufferRange drawCountBuffer,
 | |
|             BufferHolder srcIndexBuffer,
 | |
|             BufferHolder dstIndexBuffer,
 | |
|             IndexBufferPattern pattern,
 | |
|             int indexSize,
 | |
|             int srcIndexBufferOffset,
 | |
|             int srcIndexBufferSize,
 | |
|             int srcIndirectBufferOffset,
 | |
|             bool hasDrawCount,
 | |
|             int maxDrawCount,
 | |
|             int indirectDataStride)
 | |
|         {
 | |
|             // TODO: Support conversion with primitive restart enabled.
 | |
| 
 | |
|             BufferRange drawCountBufferAligned = new BufferRange(
 | |
|                 drawCountBuffer.Handle,
 | |
|                 drawCountBuffer.Offset & ~(UniformBufferAlignment - 1),
 | |
|                 UniformBufferAlignment);
 | |
| 
 | |
|             int indirectDataSize = maxDrawCount * indirectDataStride;
 | |
| 
 | |
|             int indexCount = srcIndexBufferSize / indexSize;
 | |
|             int primitivesCount = pattern.GetPrimitiveCount(indexCount);
 | |
|             int convertedCount = pattern.GetConvertedCount(indexCount);
 | |
|             int outputIndexSize = 4;
 | |
| 
 | |
|             var srcBuffer = srcIndexBuffer.GetBuffer().Get(cbs, srcIndexBufferOffset, indexCount * indexSize).Value;
 | |
|             var dstBuffer = dstIndexBuffer.GetBuffer().Get(cbs, 0, convertedCount * outputIndexSize).Value;
 | |
| 
 | |
|             const int ParamsBufferSize = 24 * sizeof(int);
 | |
|             const int ParamsIndirectDispatchOffset = 16 * sizeof(int);
 | |
|             const int ParamsIndirectDispatchSize = 3 * sizeof(int);
 | |
| 
 | |
|             Span<int> shaderParams = stackalloc int[ParamsBufferSize / sizeof(int)];
 | |
| 
 | |
|             shaderParams[8] = pattern.PrimitiveVertices;
 | |
|             shaderParams[9] = pattern.PrimitiveVerticesOut;
 | |
|             shaderParams[10] = indexSize;
 | |
|             shaderParams[11] = outputIndexSize;
 | |
|             shaderParams[12] = pattern.BaseIndex;
 | |
|             shaderParams[13] = pattern.IndexStride;
 | |
|             shaderParams[14] = srcIndexBufferOffset;
 | |
|             shaderParams[15] = primitivesCount;
 | |
|             shaderParams[16] = 1;
 | |
|             shaderParams[17] = 1;
 | |
|             shaderParams[18] = 1;
 | |
|             shaderParams[19] = hasDrawCount ? 1 : 0;
 | |
|             shaderParams[20] = maxDrawCount;
 | |
|             shaderParams[21] = (drawCountBuffer.Offset & (UniformBufferAlignment - 1)) / 4;
 | |
|             shaderParams[22] = indirectDataStride / 4;
 | |
|             shaderParams[23] = srcIndirectBufferOffset / 4;
 | |
| 
 | |
|             pattern.OffsetIndex.CopyTo(shaderParams.Slice(0, pattern.OffsetIndex.Length));
 | |
| 
 | |
|             var patternBufferHandle = gd.BufferManager.CreateWithHandle(gd, ParamsBufferSize, false, out var patternBuffer);
 | |
|             var patternBufferAuto = patternBuffer.GetBuffer();
 | |
| 
 | |
|             gd.BufferManager.SetData<int>(patternBufferHandle, 0, shaderParams);
 | |
| 
 | |
|             _pipeline.SetCommandBuffer(cbs);
 | |
| 
 | |
|             BufferHolder.InsertBufferBarrier(
 | |
|                 gd,
 | |
|                 cbs.CommandBuffer,
 | |
|                 srcIndirectBuffer.GetBuffer().Get(cbs, srcIndirectBufferOffset, indirectDataSize).Value,
 | |
|                 BufferHolder.DefaultAccessFlags,
 | |
|                 AccessFlags.AccessShaderReadBit,
 | |
|                 PipelineStageFlags.PipelineStageAllCommandsBit,
 | |
|                 PipelineStageFlags.PipelineStageComputeShaderBit,
 | |
|                 srcIndirectBufferOffset,
 | |
|                 indirectDataSize);
 | |
| 
 | |
|             _pipeline.SetUniformBuffers(0, stackalloc[] { drawCountBufferAligned });
 | |
|             _pipeline.SetStorageBuffers(1, new[] { srcIndirectBuffer.GetBuffer(), dstIndirectBuffer.GetBuffer(), patternBuffer.GetBuffer() });
 | |
| 
 | |
|             _pipeline.SetProgram(_programConvertIndirectData);
 | |
|             _pipeline.DispatchCompute(1, 1, 1);
 | |
| 
 | |
|             BufferHolder.InsertBufferBarrier(
 | |
|                 gd,
 | |
|                 cbs.CommandBuffer,
 | |
|                 patternBufferAuto.Get(cbs, ParamsIndirectDispatchOffset, ParamsIndirectDispatchSize).Value,
 | |
|                 AccessFlags.AccessShaderWriteBit,
 | |
|                 AccessFlags.AccessIndirectCommandReadBit,
 | |
|                 PipelineStageFlags.PipelineStageComputeShaderBit,
 | |
|                 PipelineStageFlags.PipelineStageDrawIndirectBit,
 | |
|                 ParamsIndirectDispatchOffset,
 | |
|                 ParamsIndirectDispatchSize);
 | |
| 
 | |
|             BufferHolder.InsertBufferBarrier(
 | |
|                 gd,
 | |
|                 cbs.CommandBuffer,
 | |
|                 dstBuffer,
 | |
|                 BufferHolder.DefaultAccessFlags,
 | |
|                 AccessFlags.AccessTransferWriteBit,
 | |
|                 PipelineStageFlags.PipelineStageAllCommandsBit,
 | |
|                 PipelineStageFlags.PipelineStageTransferBit,
 | |
|                 0,
 | |
|                 convertedCount * outputIndexSize);
 | |
| 
 | |
|             _pipeline.SetUniformBuffers(0, stackalloc[] { new BufferRange(patternBufferHandle, 0, ParamsBufferSize) });
 | |
|             _pipeline.SetStorageBuffers(1, new[] { srcIndexBuffer.GetBuffer(), dstIndexBuffer.GetBuffer() });
 | |
| 
 | |
|             _pipeline.SetProgram(_programConvertIndexBuffer);
 | |
|             _pipeline.DispatchComputeIndirect(patternBufferAuto, ParamsIndirectDispatchOffset);
 | |
| 
 | |
|             BufferHolder.InsertBufferBarrier(
 | |
|                 gd,
 | |
|                 cbs.CommandBuffer,
 | |
|                 dstBuffer,
 | |
|                 AccessFlags.AccessTransferWriteBit,
 | |
|                 BufferHolder.DefaultAccessFlags,
 | |
|                 PipelineStageFlags.PipelineStageTransferBit,
 | |
|                 PipelineStageFlags.PipelineStageAllCommandsBit,
 | |
|                 0,
 | |
|                 convertedCount * outputIndexSize);
 | |
| 
 | |
|             gd.BufferManager.Delete(patternBufferHandle);
 | |
| 
 | |
|             _pipeline.Finish(gd, cbs);
 | |
|         }
 | |
| 
 | |
|         protected virtual void Dispose(bool disposing)
 | |
|         {
 | |
|             if (disposing)
 | |
|             {
 | |
|                 _programColorBlitClearAlpha.Dispose();
 | |
|                 _programColorBlit.Dispose();
 | |
|                 _programColorClear.Dispose();
 | |
|                 _programStrideChange.Dispose();
 | |
|                 _programColorCopyBetweenMsNonMs.Dispose();
 | |
|                 _programConvertIndexBuffer.Dispose();
 | |
|                 _programConvertIndirectData.Dispose();
 | |
|                 _samplerNearest.Dispose();
 | |
|                 _samplerLinear.Dispose();
 | |
|                 _pipeline.Dispose();
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         public void Dispose()
 | |
|         {
 | |
|             Dispose(true);
 | |
|         }
 | |
|     }
 | |
| }
 |