// // Copyright (c) 2019-2021 Ryujinx // // This program is free software: you can redistribute it and/or modify // it under the terms of the GNU Lesser General Public License as published by // the Free Software Foundation, either version 3 of the License, or // (at your option) any later version. // // This program is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU Lesser General Public License for more details. // // You should have received a copy of the GNU Lesser General Public License // along with this program. If not, see . // using System; using System.Runtime.CompilerServices; using System.Runtime.InteropServices; using System.Runtime.Intrinsics; using System.Runtime.Intrinsics.Arm; using System.Runtime.Intrinsics.X86; namespace Ryujinx.Audio.Renderer.Dsp.Command { public class VolumeCommand : ICommand { public bool Enabled { get; set; } public int NodeId { get; } public CommandType CommandType => CommandType.Volume; public ulong EstimatedProcessingTime { get; set; } public ushort InputBufferIndex { get; } public ushort OutputBufferIndex { get; } public float Volume { get; } public VolumeCommand(float volume, uint bufferIndex, int nodeId) { Enabled = true; NodeId = nodeId; InputBufferIndex = (ushort)bufferIndex; OutputBufferIndex = (ushort)bufferIndex; Volume = volume; } private void ProcessVolumeAvx(Span outputBuffer, ReadOnlySpan inputBuffer) { Vector256 volumeVec = Vector256.Create(Volume); ReadOnlySpan> inputVec = MemoryMarshal.Cast>(inputBuffer); Span> outputVec = MemoryMarshal.Cast>(outputBuffer); int sisdStart = inputVec.Length * 8; for (int i = 0; i < inputVec.Length; i++) { outputVec[i] = Avx.Ceiling(Avx.Multiply(inputVec[i], volumeVec)); } for (int i = sisdStart; i < inputBuffer.Length; i++) { outputBuffer[i] = FloatingPointHelper.MultiplyRoundUp(inputBuffer[i], Volume); } } private void ProcessVolumeSse41(Span outputBuffer, ReadOnlySpan inputBuffer) { Vector128 volumeVec = Vector128.Create(Volume); ReadOnlySpan> inputVec = MemoryMarshal.Cast>(inputBuffer); Span> outputVec = MemoryMarshal.Cast>(outputBuffer); int sisdStart = inputVec.Length * 4; for (int i = 0; i < inputVec.Length; i++) { outputVec[i] = Sse41.Ceiling(Sse.Multiply(inputVec[i], volumeVec)); } for (int i = sisdStart; i < inputBuffer.Length; i++) { outputBuffer[i] = FloatingPointHelper.MultiplyRoundUp(inputBuffer[i], Volume); } } private void ProcessVolumeAdvSimd(Span outputBuffer, ReadOnlySpan inputBuffer) { Vector128 volumeVec = Vector128.Create(Volume); ReadOnlySpan> inputVec = MemoryMarshal.Cast>(inputBuffer); Span> outputVec = MemoryMarshal.Cast>(outputBuffer); int sisdStart = inputVec.Length * 4; for (int i = 0; i < inputVec.Length; i++) { outputVec[i] = AdvSimd.Ceiling(AdvSimd.Multiply(inputVec[i], volumeVec)); } for (int i = sisdStart; i < inputBuffer.Length; i++) { outputBuffer[i] = FloatingPointHelper.MultiplyRoundUp(inputBuffer[i], Volume); } } private void ProcessVolume(Span outputBuffer, ReadOnlySpan inputBuffer) { if (Avx.IsSupported) { ProcessVolumeAvx(outputBuffer, inputBuffer); } else if (Sse41.IsSupported) { ProcessVolumeSse41(outputBuffer, inputBuffer); } else if (AdvSimd.IsSupported) { ProcessVolumeAdvSimd(outputBuffer, inputBuffer); } else { ProcessVolumeSlowPath(outputBuffer, inputBuffer); } } [MethodImpl(MethodImplOptions.AggressiveInlining)] private void ProcessVolumeSlowPath(Span outputBuffer, ReadOnlySpan inputBuffer) { for (int i = 0; i < outputBuffer.Length; i++) { outputBuffer[i] = FloatingPointHelper.MultiplyRoundUp(inputBuffer[i], Volume); } } public void Process(CommandList context) { ReadOnlySpan inputBuffer = context.GetBuffer(InputBufferIndex); Span outputBuffer = context.GetBuffer(OutputBufferIndex); ProcessVolume(outputBuffer, inputBuffer); } } }