8a33e884f8
* Fix Vnmls_S fast path (F64: losing input d value). Fix Vnmla_S & Vnmls_S slow paths (using fused inst.s). Add Vfma_S & Vfms_S Fma fast paths. Add Vfnma_S inst. with Fma/Sse fast paths and slow path. Add Vfnms_S Sse fast path. Add Tests for affected inst.s. Nits. * InternalVersion = 1775 * Nits. * Fix Vfma_V slow path not using StandardFPSCRValue(). * Nit: Fix Vfma_V order. * Add Vfms_V Sse fast path and slow path. * Add Vfma_V and Vfms_V Test.
264 lines
10 KiB
C#
264 lines
10 KiB
C#
#define SimdCvt32
|
|
|
|
using ARMeilleure.State;
|
|
using NUnit.Framework;
|
|
using System;
|
|
using System.Collections.Generic;
|
|
|
|
namespace Ryujinx.Tests.Cpu
|
|
{
|
|
[Category("SimdCvt32")]
|
|
public sealed class CpuTestSimdCvt32 : CpuTest32
|
|
{
|
|
#if SimdCvt32
|
|
|
|
#region "ValueSource (Opcodes)"
|
|
#endregion
|
|
|
|
#region "ValueSource (Types)"
|
|
private static uint[] _1S_()
|
|
{
|
|
return new uint[] { 0x00000000u, 0x7FFFFFFFu,
|
|
0x80000000u, 0xFFFFFFFFu };
|
|
}
|
|
|
|
private static IEnumerable<ulong> _1S_F_()
|
|
{
|
|
yield return 0x00000000FF7FFFFFul; // -Max Normal (float.MinValue)
|
|
yield return 0x0000000080800000ul; // -Min Normal
|
|
yield return 0x00000000807FFFFFul; // -Max Subnormal
|
|
yield return 0x0000000080000001ul; // -Min Subnormal (-float.Epsilon)
|
|
yield return 0x000000007F7FFFFFul; // +Max Normal (float.MaxValue)
|
|
yield return 0x0000000000800000ul; // +Min Normal
|
|
yield return 0x00000000007FFFFFul; // +Max Subnormal
|
|
yield return 0x0000000000000001ul; // +Min Subnormal (float.Epsilon)
|
|
|
|
if (!NoZeros)
|
|
{
|
|
yield return 0x0000000080000000ul; // -Zero
|
|
yield return 0x0000000000000000ul; // +Zero
|
|
}
|
|
|
|
if (!NoInfs)
|
|
{
|
|
yield return 0x00000000FF800000ul; // -Infinity
|
|
yield return 0x000000007F800000ul; // +Infinity
|
|
}
|
|
|
|
if (!NoNaNs)
|
|
{
|
|
yield return 0x00000000FFC00000ul; // -QNaN (all zeros payload) (float.NaN)
|
|
yield return 0x00000000FFBFFFFFul; // -SNaN (all ones payload)
|
|
yield return 0x000000007FC00000ul; // +QNaN (all zeros payload) (-float.NaN) (DefaultNaN)
|
|
yield return 0x000000007FBFFFFFul; // +SNaN (all ones payload)
|
|
}
|
|
|
|
for (int cnt = 1; cnt <= RndCnt; cnt++)
|
|
{
|
|
ulong grbg = TestContext.CurrentContext.Random.NextUInt();
|
|
ulong rnd1 = GenNormalS();
|
|
ulong rnd2 = GenSubnormalS();
|
|
|
|
yield return (grbg << 32) | rnd1;
|
|
yield return (grbg << 32) | rnd2;
|
|
}
|
|
}
|
|
|
|
private static IEnumerable<ulong> _1D_F_()
|
|
{
|
|
yield return 0xFFEFFFFFFFFFFFFFul; // -Max Normal (double.MinValue)
|
|
yield return 0x8010000000000000ul; // -Min Normal
|
|
yield return 0x800FFFFFFFFFFFFFul; // -Max Subnormal
|
|
yield return 0x8000000000000001ul; // -Min Subnormal (-double.Epsilon)
|
|
yield return 0x7FEFFFFFFFFFFFFFul; // +Max Normal (double.MaxValue)
|
|
yield return 0x0010000000000000ul; // +Min Normal
|
|
yield return 0x000FFFFFFFFFFFFFul; // +Max Subnormal
|
|
yield return 0x0000000000000001ul; // +Min Subnormal (double.Epsilon)
|
|
|
|
if (!NoZeros)
|
|
{
|
|
yield return 0x8000000000000000ul; // -Zero
|
|
yield return 0x0000000000000000ul; // +Zero
|
|
}
|
|
|
|
if (!NoInfs)
|
|
{
|
|
yield return 0xFFF0000000000000ul; // -Infinity
|
|
yield return 0x7FF0000000000000ul; // +Infinity
|
|
}
|
|
|
|
if (!NoNaNs)
|
|
{
|
|
yield return 0xFFF8000000000000ul; // -QNaN (all zeros payload) (double.NaN)
|
|
yield return 0xFFF7FFFFFFFFFFFFul; // -SNaN (all ones payload)
|
|
yield return 0x7FF8000000000000ul; // +QNaN (all zeros payload) (-double.NaN) (DefaultNaN)
|
|
yield return 0x7FF7FFFFFFFFFFFFul; // +SNaN (all ones payload)
|
|
}
|
|
|
|
for (int cnt = 1; cnt <= RndCnt; cnt++)
|
|
{
|
|
ulong rnd1 = GenNormalD();
|
|
ulong rnd2 = GenSubnormalD();
|
|
|
|
yield return rnd1;
|
|
yield return rnd2;
|
|
}
|
|
}
|
|
#endregion
|
|
|
|
private const int RndCnt = 2;
|
|
|
|
private static readonly bool NoZeros = false;
|
|
private static readonly bool NoInfs = false;
|
|
private static readonly bool NoNaNs = false;
|
|
|
|
[Explicit]
|
|
[Test, Pairwise, Description("VCVT.<dt>.F32 <Sd>, <Sm>")]
|
|
public void Vcvt_F32_I32([Values(0u, 1u, 2u, 3u)] uint rd,
|
|
[Values(0u, 1u, 2u, 3u)] uint rm,
|
|
[ValueSource(nameof(_1S_F_))] ulong s0,
|
|
[ValueSource(nameof(_1S_F_))] ulong s1,
|
|
[ValueSource(nameof(_1S_F_))] ulong s2,
|
|
[ValueSource(nameof(_1S_F_))] ulong s3,
|
|
[Values] bool unsigned) // <U32, S32>
|
|
{
|
|
uint opcode = 0xeebc0ac0u; // VCVT.U32.F32 S0, S0
|
|
|
|
if (!unsigned)
|
|
{
|
|
opcode |= 1 << 16; // opc2<0>
|
|
}
|
|
|
|
opcode |= ((rd & 0x1e) << 11) | ((rd & 0x1) << 22);
|
|
opcode |= ((rm & 0x1e) >> 1) | ((rm & 0x1) << 5);
|
|
|
|
V128 v0 = MakeVectorE0E1E2E3((uint)s0, (uint)s1, (uint)s2, (uint)s3);
|
|
|
|
SingleOpcode(opcode, v0: v0);
|
|
|
|
CompareAgainstUnicorn();
|
|
}
|
|
|
|
[Explicit]
|
|
[Test, Pairwise, Description("VCVT.<dt>.F64 <Sd>, <Dm>")]
|
|
public void Vcvt_F64_I32([Values(0u, 1u, 2u, 3u)] uint rd,
|
|
[Values(0u, 1u)] uint rm,
|
|
[ValueSource(nameof(_1D_F_))] ulong d0,
|
|
[ValueSource(nameof(_1D_F_))] ulong d1,
|
|
[Values] bool unsigned) // <U32, S32>
|
|
{
|
|
uint opcode = 0xeebc0bc0u; // VCVT.U32.F64 S0, D0
|
|
|
|
if (!unsigned)
|
|
{
|
|
opcode |= 1 << 16; // opc2<0>
|
|
}
|
|
|
|
opcode |= ((rd & 0x1e) << 11) | ((rd & 0x1) << 22);
|
|
opcode |= ((rm & 0xf) << 0) | ((rm & 0x10) << 1);
|
|
|
|
V128 v0 = MakeVectorE0E1(d0, d1);
|
|
|
|
SingleOpcode(opcode, v0: v0);
|
|
|
|
CompareAgainstUnicorn();
|
|
}
|
|
|
|
[Explicit]
|
|
[Test, Pairwise, Description("VCVT.F32.<dt> <Sd>, <Sm>")]
|
|
public void Vcvt_I32_F32([Values(0u, 1u, 2u, 3u)] uint rd,
|
|
[Values(0u, 1u, 2u, 3u)] uint rm,
|
|
[ValueSource(nameof(_1S_))] [Random(RndCnt)] uint s0,
|
|
[ValueSource(nameof(_1S_))] [Random(RndCnt)] uint s1,
|
|
[ValueSource(nameof(_1S_))] [Random(RndCnt)] uint s2,
|
|
[ValueSource(nameof(_1S_))] [Random(RndCnt)] uint s3,
|
|
[Values] bool unsigned, // <U32, S32>
|
|
[Values(RMode.Rn)] RMode rMode)
|
|
{
|
|
uint opcode = 0xeeb80a40u; // VCVT.F32.U32 S0, S0
|
|
|
|
if (!unsigned)
|
|
{
|
|
opcode |= 1 << 7; // op
|
|
}
|
|
|
|
opcode |= ((rm & 0x1e) >> 1) | ((rm & 0x1) << 5);
|
|
opcode |= ((rd & 0x1e) << 11) | ((rd & 0x1) << 22);
|
|
|
|
V128 v0 = MakeVectorE0E1E2E3(s0, s1, s2, s3);
|
|
|
|
int fpscr = (int)rMode << (int)Fpcr.RMode;
|
|
|
|
SingleOpcode(opcode, v0: v0, fpscr: fpscr);
|
|
|
|
CompareAgainstUnicorn();
|
|
}
|
|
|
|
[Explicit]
|
|
[Test, Pairwise, Description("VCVT.F64.<dt> <Dd>, <Sm>")]
|
|
public void Vcvt_I32_F64([Values(0u, 1u)] uint rd,
|
|
[Values(0u, 1u, 2u, 3u)] uint rm,
|
|
[ValueSource(nameof(_1S_))] [Random(RndCnt)] uint s0,
|
|
[ValueSource(nameof(_1S_))] [Random(RndCnt)] uint s1,
|
|
[ValueSource(nameof(_1S_))] [Random(RndCnt)] uint s2,
|
|
[ValueSource(nameof(_1S_))] [Random(RndCnt)] uint s3,
|
|
[Values] bool unsigned, // <U32, S32>
|
|
[Values(RMode.Rn)] RMode rMode)
|
|
{
|
|
uint opcode = 0xeeb80b40u; // VCVT.F64.U32 D0, S0
|
|
|
|
if (!unsigned)
|
|
{
|
|
opcode |= 1 << 7; // op
|
|
}
|
|
|
|
opcode |= ((rm & 0x1e) >> 1) | ((rm & 0x1) << 5);
|
|
opcode |= ((rd & 0xf) << 12) | ((rd & 0x10) << 18);
|
|
|
|
V128 v0 = MakeVectorE0E1E2E3(s0, s1, s2, s3);
|
|
|
|
int fpscr = (int)rMode << (int)Fpcr.RMode;
|
|
|
|
SingleOpcode(opcode, v0: v0, fpscr: fpscr);
|
|
|
|
CompareAgainstUnicorn();
|
|
}
|
|
|
|
[Test, Pairwise, Description("VRINTX.F<size> <Sd>, <Sm>")]
|
|
public void Vrintx_S([Values(0u, 1u)] uint rd,
|
|
[Values(0u, 1u)] uint rm,
|
|
[Values(2u, 3u)] uint size,
|
|
[ValueSource(nameof(_1D_F_))] ulong s0,
|
|
[ValueSource(nameof(_1D_F_))] ulong s1,
|
|
[ValueSource(nameof(_1D_F_))] ulong s2,
|
|
[Values(RMode.Rn, RMode.Rm, RMode.Rp)] RMode rMode)
|
|
{
|
|
uint opcode = 0xEB70A40;
|
|
V128 v0, v1, v2;
|
|
if (size == 2)
|
|
{
|
|
opcode |= ((rm & 0x1e) >> 1) | ((rm & 0x1) << 5);
|
|
opcode |= ((rd & 0x1e) >> 11) | ((rm & 0x1) << 22);
|
|
v0 = MakeVectorE0E1((uint)BitConverter.SingleToInt32Bits(s0), (uint)BitConverter.SingleToInt32Bits(s0));
|
|
v1 = MakeVectorE0E1((uint)BitConverter.SingleToInt32Bits(s1), (uint)BitConverter.SingleToInt32Bits(s0));
|
|
v2 = MakeVectorE0E1((uint)BitConverter.SingleToInt32Bits(s2), (uint)BitConverter.SingleToInt32Bits(s1));
|
|
}
|
|
else
|
|
{
|
|
opcode |= ((rm & 0xf) << 0) | ((rd & 0x10) << 1);
|
|
opcode |= ((rd & 0xf) << 12) | ((rd & 0x10) << 18);
|
|
v0 = MakeVectorE0E1((uint)BitConverter.DoubleToInt64Bits(s0), (uint)BitConverter.DoubleToInt64Bits(s0));
|
|
v1 = MakeVectorE0E1((uint)BitConverter.DoubleToInt64Bits(s1), (uint)BitConverter.DoubleToInt64Bits(s0));
|
|
v2 = MakeVectorE0E1((uint)BitConverter.DoubleToInt64Bits(s2), (uint)BitConverter.DoubleToInt64Bits(s1));
|
|
}
|
|
|
|
opcode |= ((size & 3) << 8);
|
|
|
|
int fpscr = (int)rMode << (int)Fpcr.RMode;
|
|
SingleOpcode(opcode, v0: v0, v1: v1, v2: v2, fpscr: fpscr);
|
|
|
|
CompareAgainstUnicorn();
|
|
}
|
|
#endif
|
|
}
|
|
}
|