// // Copyright (c) 2019-2021 Ryujinx // // This program is free software: you can redistribute it and/or modify // it under the terms of the GNU Lesser General Public License as published by // the Free Software Foundation, either version 3 of the License, or // (at your option) any later version. // // This program is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public License // along with this program. If not, see . // using System; using System.Runtime.CompilerServices; using System.Runtime.InteropServices; using System.Runtime.Intrinsics; using System.Runtime.Intrinsics.Arm; using System.Runtime.Intrinsics.X86; namespace Ryujinx.Audio.Renderer.Dsp.Command { public class MixCommand : ICommand { public bool Enabled { get; set; } public int NodeId { get; } public CommandType CommandType => CommandType.Mix; public ulong EstimatedProcessingTime { get; set; } public ushort InputBufferIndex { get; } public ushort OutputBufferIndex { get; } public float Volume { get; } public MixCommand(uint inputBufferIndex, uint outputBufferIndex, int nodeId, float volume) { Enabled = true; NodeId = nodeId; InputBufferIndex = (ushort)inputBufferIndex; OutputBufferIndex = (ushort)outputBufferIndex; Volume = volume; } private void ProcessMixAvx(Span outputMix, ReadOnlySpan inputMix) { Vector256 volumeVec = Vector256.Create(Volume); ReadOnlySpan> inputVec = MemoryMarshal.Cast>(inputMix); Span> outputVec = MemoryMarshal.Cast>(outputMix); int sisdStart = inputVec.Length * 8; for (int i = 0; i < inputVec.Length; i++) { outputVec[i] = Avx.Add(outputVec[i], Avx.Ceiling(Avx.Multiply(inputVec[i], volumeVec))); } for (int i = sisdStart; i < inputMix.Length; i++) { outputMix[i] += FloatingPointHelper.MultiplyRoundUp(inputMix[i], Volume); } } private void ProcessMixSse41(Span outputMix, ReadOnlySpan inputMix) { Vector128 volumeVec = Vector128.Create(Volume); ReadOnlySpan> inputVec = MemoryMarshal.Cast>(inputMix); Span> outputVec = MemoryMarshal.Cast>(outputMix); int sisdStart = inputVec.Length * 4; for (int i = 0; i < inputVec.Length; i++) { outputVec[i] = Sse.Add(outputVec[i], Sse41.Ceiling(Sse.Multiply(inputVec[i], volumeVec))); } for (int i = sisdStart; i < inputMix.Length; i++) { outputMix[i] += FloatingPointHelper.MultiplyRoundUp(inputMix[i], Volume); } } [MethodImpl(MethodImplOptions.AggressiveInlining)] private void ProcessMixAdvSimd(Span outputMix, ReadOnlySpan inputMix) { Vector128 volumeVec = Vector128.Create(Volume); ReadOnlySpan> inputVec = MemoryMarshal.Cast>(inputMix); Span> outputVec = MemoryMarshal.Cast>(outputMix); int sisdStart = inputVec.Length * 4; for (int i = 0; i < inputVec.Length; i++) { outputVec[i] = AdvSimd.Add(outputVec[i], AdvSimd.Ceiling(AdvSimd.Multiply(inputVec[i], volumeVec))); } for (int i = sisdStart; i < inputMix.Length; i++) { outputMix[i] += FloatingPointHelper.MultiplyRoundUp(inputMix[i], Volume); } } [MethodImpl(MethodImplOptions.AggressiveInlining)] private void ProcessMixSlowPath(Span outputMix, ReadOnlySpan inputMix) { for (int i = 0; i < inputMix.Length; i++) { outputMix[i] += FloatingPointHelper.MultiplyRoundUp(inputMix[i], Volume); } } private void ProcessMix(Span outputMix, ReadOnlySpan inputMix) { if (Avx.IsSupported) { ProcessMixAvx(outputMix, inputMix); } else if (Sse41.IsSupported) { ProcessMixSse41(outputMix, inputMix); } else if (AdvSimd.IsSupported) { ProcessMixAdvSimd(outputMix, inputMix); } else { ProcessMixSlowPath(outputMix, inputMix); } } public void Process(CommandList context) { ReadOnlySpan inputBuffer = context.GetBuffer(InputBufferIndex); Span outputBuffer = context.GetBuffer(OutputBufferIndex); ProcessMix(outputBuffer, inputBuffer); } } }