forked from Mirror/Ryujinx
dff138229c
* amadeus: Allow OOB read of GC-ADPCM coefficients Fixes "Ninja Gaiden Sigma 2" and possibly "NINJA GAIDEN 3: Razor's Edge" * amadeus: Fix wrong variable usage in delay effect We should transform the delay line values, not the input. * amadeus: Update GroupedBiquadFilterCommand documentation * amadeus: Simplify PoolMapper alignment checks * amadeus: Update Surround delay effect matrix to REV11 * amadeus: Add drop parameter support and use 32 bits integers for estimate time Also implement accurate ExecuteAudioRendererRendering stub. * Address gdkchan's comments * Address gdkchan's other comments * Address gdkchan's comment
137 lines
No EOL
4.7 KiB
C#
137 lines
No EOL
4.7 KiB
C#
using System;
|
|
using System.Runtime.CompilerServices;
|
|
using System.Runtime.InteropServices;
|
|
using System.Runtime.Intrinsics;
|
|
using System.Runtime.Intrinsics.Arm;
|
|
using System.Runtime.Intrinsics.X86;
|
|
|
|
namespace Ryujinx.Audio.Renderer.Dsp.Command
|
|
{
|
|
public class MixCommand : ICommand
|
|
{
|
|
public bool Enabled { get; set; }
|
|
|
|
public int NodeId { get; }
|
|
|
|
public CommandType CommandType => CommandType.Mix;
|
|
|
|
public uint EstimatedProcessingTime { get; set; }
|
|
|
|
public ushort InputBufferIndex { get; }
|
|
public ushort OutputBufferIndex { get; }
|
|
|
|
public float Volume { get; }
|
|
|
|
public MixCommand(uint inputBufferIndex, uint outputBufferIndex, int nodeId, float volume)
|
|
{
|
|
Enabled = true;
|
|
NodeId = nodeId;
|
|
|
|
InputBufferIndex = (ushort)inputBufferIndex;
|
|
OutputBufferIndex = (ushort)outputBufferIndex;
|
|
|
|
Volume = volume;
|
|
}
|
|
|
|
[MethodImpl(MethodImplOptions.AggressiveInlining)]
|
|
private void ProcessMixAvx(Span<float> outputMix, ReadOnlySpan<float> inputMix)
|
|
{
|
|
Vector256<float> volumeVec = Vector256.Create(Volume);
|
|
|
|
ReadOnlySpan<Vector256<float>> inputVec = MemoryMarshal.Cast<float, Vector256<float>>(inputMix);
|
|
Span<Vector256<float>> outputVec = MemoryMarshal.Cast<float, Vector256<float>>(outputMix);
|
|
|
|
int sisdStart = inputVec.Length * 8;
|
|
|
|
for (int i = 0; i < inputVec.Length; i++)
|
|
{
|
|
outputVec[i] = Avx.Add(outputVec[i], Avx.Ceiling(Avx.Multiply(inputVec[i], volumeVec)));
|
|
}
|
|
|
|
for (int i = sisdStart; i < inputMix.Length; i++)
|
|
{
|
|
outputMix[i] += FloatingPointHelper.MultiplyRoundUp(inputMix[i], Volume);
|
|
}
|
|
}
|
|
|
|
[MethodImpl(MethodImplOptions.AggressiveInlining)]
|
|
private void ProcessMixSse41(Span<float> outputMix, ReadOnlySpan<float> inputMix)
|
|
{
|
|
Vector128<float> volumeVec = Vector128.Create(Volume);
|
|
|
|
ReadOnlySpan<Vector128<float>> inputVec = MemoryMarshal.Cast<float, Vector128<float>>(inputMix);
|
|
Span<Vector128<float>> outputVec = MemoryMarshal.Cast<float, Vector128<float>>(outputMix);
|
|
|
|
int sisdStart = inputVec.Length * 4;
|
|
|
|
for (int i = 0; i < inputVec.Length; i++)
|
|
{
|
|
outputVec[i] = Sse.Add(outputVec[i], Sse41.Ceiling(Sse.Multiply(inputVec[i], volumeVec)));
|
|
}
|
|
|
|
for (int i = sisdStart; i < inputMix.Length; i++)
|
|
{
|
|
outputMix[i] += FloatingPointHelper.MultiplyRoundUp(inputMix[i], Volume);
|
|
}
|
|
}
|
|
|
|
[MethodImpl(MethodImplOptions.AggressiveInlining)]
|
|
private void ProcessMixAdvSimd(Span<float> outputMix, ReadOnlySpan<float> inputMix)
|
|
{
|
|
Vector128<float> volumeVec = Vector128.Create(Volume);
|
|
|
|
ReadOnlySpan<Vector128<float>> inputVec = MemoryMarshal.Cast<float, Vector128<float>>(inputMix);
|
|
Span<Vector128<float>> outputVec = MemoryMarshal.Cast<float, Vector128<float>>(outputMix);
|
|
|
|
int sisdStart = inputVec.Length * 4;
|
|
|
|
for (int i = 0; i < inputVec.Length; i++)
|
|
{
|
|
outputVec[i] = AdvSimd.Add(outputVec[i], AdvSimd.Ceiling(AdvSimd.Multiply(inputVec[i], volumeVec)));
|
|
}
|
|
|
|
for (int i = sisdStart; i < inputMix.Length; i++)
|
|
{
|
|
outputMix[i] += FloatingPointHelper.MultiplyRoundUp(inputMix[i], Volume);
|
|
}
|
|
}
|
|
|
|
[MethodImpl(MethodImplOptions.AggressiveInlining)]
|
|
private void ProcessMixSlowPath(Span<float> outputMix, ReadOnlySpan<float> inputMix)
|
|
{
|
|
for (int i = 0; i < inputMix.Length; i++)
|
|
{
|
|
outputMix[i] += FloatingPointHelper.MultiplyRoundUp(inputMix[i], Volume);
|
|
}
|
|
}
|
|
|
|
[MethodImpl(MethodImplOptions.AggressiveInlining)]
|
|
private void ProcessMix(Span<float> outputMix, ReadOnlySpan<float> inputMix)
|
|
{
|
|
if (Avx.IsSupported)
|
|
{
|
|
ProcessMixAvx(outputMix, inputMix);
|
|
}
|
|
else if (Sse41.IsSupported)
|
|
{
|
|
ProcessMixSse41(outputMix, inputMix);
|
|
}
|
|
else if (AdvSimd.IsSupported)
|
|
{
|
|
ProcessMixAdvSimd(outputMix, inputMix);
|
|
}
|
|
else
|
|
{
|
|
ProcessMixSlowPath(outputMix, inputMix);
|
|
}
|
|
}
|
|
|
|
public void Process(CommandList context)
|
|
{
|
|
ReadOnlySpan<float> inputBuffer = context.GetBuffer(InputBufferIndex);
|
|
Span<float> outputBuffer = context.GetBuffer(OutputBufferIndex);
|
|
|
|
ProcessMix(outputBuffer, inputBuffer);
|
|
}
|
|
}
|
|
} |