 edfd4d70c0
			
		
	
	
		edfd4d70c0
		
			
		
	
	
	
	
		
			
			* Use SIMD acceleration for audio upsampler filter kernel for a moderate speedup * Address formatting. Implement AVX2 fast path for high quality resampling in ResamplerHelper * now really, are we really getting the benefit of inlining 50+ line methods? * adding unit tests for resampler + upsampler. The upsampler ones fail for some reason * Fixing upsampler test. Apparently this algo only works at specific ratios --------- Co-authored-by: Logan Stromberg <lostromb@microsoft.com>
		
			
				
	
	
		
			192 lines
		
	
	
		
			No EOL
		
	
	
		
			7.5 KiB
		
	
	
	
		
			C#
		
	
	
	
	
	
			
		
		
	
	
			192 lines
		
	
	
		
			No EOL
		
	
	
		
			7.5 KiB
		
	
	
	
		
			C#
		
	
	
	
	
	
| using Ryujinx.Audio.Renderer.Server.Upsampler;
 | |
| using Ryujinx.Common.Memory;
 | |
| using System;
 | |
| using System.Diagnostics;
 | |
| using System.Numerics;
 | |
| using System.Runtime.CompilerServices;
 | |
| 
 | |
| namespace Ryujinx.Audio.Renderer.Dsp
 | |
| {
 | |
|     public class UpsamplerHelper
 | |
|     {
 | |
|         private const int HistoryLength = UpsamplerBufferState.HistoryLength;
 | |
|         private const int FilterBankLength = 20;
 | |
|         // Bank0 = [0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0];
 | |
|         private const int Bank0CenterIndex = 9;
 | |
|         private static readonly Array20<float> Bank1 = PrecomputeFilterBank(1.0f / 6.0f);
 | |
|         private static readonly Array20<float> Bank2 = PrecomputeFilterBank(2.0f / 6.0f);
 | |
|         private static readonly Array20<float> Bank3 = PrecomputeFilterBank(3.0f / 6.0f);
 | |
|         private static readonly Array20<float> Bank4 = PrecomputeFilterBank(4.0f / 6.0f);
 | |
|         private static readonly Array20<float> Bank5 = PrecomputeFilterBank(5.0f / 6.0f);
 | |
| 
 | |
|         private static Array20<float> PrecomputeFilterBank(float offset)
 | |
|         {
 | |
|             float Sinc(float x)
 | |
|             {
 | |
|                 if (x == 0)
 | |
|                 {
 | |
|                     return 1.0f;
 | |
|                 }
 | |
|                 return (MathF.Sin(MathF.PI * x) / (MathF.PI * x));
 | |
|             }
 | |
| 
 | |
|             float BlackmanWindow(float x)
 | |
|             {
 | |
|                 const float a = 0.18f;
 | |
|                 const float a0 = 0.5f - 0.5f * a;
 | |
|                 const float a1 = -0.5f;
 | |
|                 const float a2 = 0.5f * a;
 | |
|                 return a0 + a1 * MathF.Cos(2 * MathF.PI * x) + a2 * MathF.Cos(4 * MathF.PI * x);
 | |
|             }
 | |
|             
 | |
|             Array20<float> result = new Array20<float>();
 | |
| 
 | |
|             for (int i = 0; i < FilterBankLength; i++)
 | |
|             {
 | |
|                 float x = (Bank0CenterIndex - i) + offset;
 | |
|                 result[i] = Sinc(x) * BlackmanWindow(x / FilterBankLength + 0.5f);
 | |
|             }
 | |
| 
 | |
|             return result;
 | |
|         }
 | |
| 
 | |
|         // Polyphase upsampling algorithm
 | |
|         [MethodImpl(MethodImplOptions.AggressiveInlining)]
 | |
|         public static void Upsample(Span<float> outputBuffer, ReadOnlySpan<float> inputBuffer, int outputSampleCount, int inputSampleCount, ref UpsamplerBufferState state)
 | |
|         {
 | |
|             if (!state.Initialized)
 | |
|             {
 | |
|                 state.Scale = inputSampleCount switch
 | |
|                 {
 | |
|                     40  => 6.0f,
 | |
|                     80  => 3.0f,
 | |
|                     160 => 1.5f,
 | |
|                     _   => throw new ArgumentOutOfRangeException()
 | |
|                 };
 | |
|                 state.Initialized = true;
 | |
|             }
 | |
| 
 | |
|             if (outputSampleCount == 0)
 | |
|             {
 | |
|                 return;
 | |
|             }
 | |
| 
 | |
|             float DoFilterBank(ref UpsamplerBufferState state, in Array20<float> bank)
 | |
|             {
 | |
|                 float result = 0.0f;
 | |
| 
 | |
|                 Debug.Assert(state.History.Length == HistoryLength);
 | |
|                 Debug.Assert(bank.Length == FilterBankLength);
 | |
| 
 | |
|                 int curIdx = 0;
 | |
|                 if (Vector.IsHardwareAccelerated)
 | |
|                 {
 | |
|                     // Do SIMD-accelerated block operations where possible.
 | |
|                     // Only about a 2x speedup since filter bank length is short
 | |
|                     int stopIdx = FilterBankLength - (FilterBankLength % Vector<float>.Count);
 | |
|                     while (curIdx < stopIdx)
 | |
|                     {
 | |
|                         result += Vector.Dot(
 | |
|                             new Vector<float>(bank.AsSpan().Slice(curIdx, Vector<float>.Count)),
 | |
|                             new Vector<float>(state.History.AsSpan().Slice(curIdx, Vector<float>.Count)));
 | |
|                         curIdx += Vector<float>.Count;
 | |
|                     }
 | |
|                 }
 | |
| 
 | |
|                 while (curIdx < FilterBankLength)
 | |
|                 {
 | |
|                     result += bank[curIdx] * state.History[curIdx];
 | |
|                     curIdx++;
 | |
|                 }
 | |
| 
 | |
|                 return result;
 | |
|             }
 | |
| 
 | |
|             [MethodImpl(MethodImplOptions.AggressiveInlining)]
 | |
|             void NextInput(ref UpsamplerBufferState state, float input)
 | |
|             {
 | |
|                 state.History.AsSpan().Slice(1).CopyTo(state.History.AsSpan());
 | |
|                 state.History[HistoryLength - 1] = input;
 | |
|             }
 | |
| 
 | |
|             int inputBufferIndex = 0;
 | |
| 
 | |
|             switch (state.Scale)
 | |
|             { 
 | |
|                 case 6.0f:
 | |
|                     for (int i = 0; i < outputSampleCount; i++)
 | |
|                     {
 | |
|                         switch (state.Phase)
 | |
|                         {
 | |
|                             case 0:
 | |
|                                 NextInput(ref state, inputBuffer[inputBufferIndex++]);
 | |
|                                 outputBuffer[i] = state.History[Bank0CenterIndex];
 | |
|                                 break;
 | |
|                             case 1:
 | |
|                                 outputBuffer[i] = DoFilterBank(ref state, Bank1);
 | |
|                                 break;
 | |
|                             case 2:
 | |
|                                 outputBuffer[i] = DoFilterBank(ref state, Bank2);
 | |
|                                 break;
 | |
|                             case 3:
 | |
|                                 outputBuffer[i] = DoFilterBank(ref state, Bank3);
 | |
|                                 break;
 | |
|                             case 4:
 | |
|                                 outputBuffer[i] = DoFilterBank(ref state, Bank4);
 | |
|                                 break;
 | |
|                             case 5:
 | |
|                                 outputBuffer[i] = DoFilterBank(ref state, Bank5);
 | |
|                                 break;
 | |
|                         }
 | |
| 
 | |
|                         state.Phase = (state.Phase + 1) % 6;
 | |
|                     }
 | |
|                     break;
 | |
|                 case 3.0f:
 | |
|                     for (int i = 0; i < outputSampleCount; i++)
 | |
|                     {
 | |
|                         switch (state.Phase)
 | |
|                         {
 | |
|                             case 0:
 | |
|                                 NextInput(ref state, inputBuffer[inputBufferIndex++]);
 | |
|                                 outputBuffer[i] = state.History[Bank0CenterIndex];
 | |
|                                 break;
 | |
|                             case 1:
 | |
|                                 outputBuffer[i] = DoFilterBank(ref state, Bank2);
 | |
|                                 break;
 | |
|                             case 2:
 | |
|                                 outputBuffer[i] = DoFilterBank(ref state, Bank4);
 | |
|                                 break;
 | |
|                         }
 | |
| 
 | |
|                         state.Phase = (state.Phase + 1) % 3;
 | |
|                     }
 | |
|                     break;
 | |
|                 case 1.5f:
 | |
|                     // Upsample by 3 then decimate by 2.
 | |
|                     for (int i = 0; i < outputSampleCount; i++)
 | |
|                     {
 | |
|                         switch (state.Phase)
 | |
|                         {
 | |
|                             case 0:
 | |
|                                 NextInput(ref state, inputBuffer[inputBufferIndex++]);
 | |
|                                 outputBuffer[i] = state.History[Bank0CenterIndex];
 | |
|                                 break;
 | |
|                             case 1:
 | |
|                                 outputBuffer[i] = DoFilterBank(ref state, Bank4);
 | |
|                                 break;
 | |
|                             case 2:
 | |
|                                 NextInput(ref state, inputBuffer[inputBufferIndex++]);
 | |
|                                 outputBuffer[i] = DoFilterBank(ref state, Bank2);
 | |
|                                 break;
 | |
|                         }
 | |
| 
 | |
|                         state.Phase = (state.Phase + 1) % 3;
 | |
|                     }
 | |
|                     break;
 | |
|                 default:
 | |
|                     throw new ArgumentOutOfRangeException();
 | |
|             }
 | |
|         }
 | |
|     }
 | |
| } |