2018-10-26 00:10:41 +02:00
|
|
|
// https://github.com/intel/ARM_NEON_2_x86_SSE/blob/master/NEON_2_SSE.h
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
using ChocolArm64.Decoder;
|
|
|
|
using ChocolArm64.State;
|
|
|
|
using ChocolArm64.Translation;
|
|
|
|
using System;
|
|
|
|
using System.Reflection;
|
|
|
|
using System.Reflection.Emit;
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
using System.Runtime.Intrinsics;
|
2018-05-12 01:10:27 +02:00
|
|
|
using System.Runtime.Intrinsics.X86;
|
2018-02-17 22:06:11 +01:00
|
|
|
|
|
|
|
using static ChocolArm64.Instruction.AInstEmitSimdHelper;
|
|
|
|
|
|
|
|
namespace ChocolArm64.Instruction
|
|
|
|
{
|
|
|
|
static partial class AInstEmit
|
|
|
|
{
|
2018-04-18 15:56:27 +02:00
|
|
|
public static void Abs_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarUnaryOpSx(Context, () => EmitAbs(Context));
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Abs_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorUnaryOpSx(Context, () => EmitAbs(Context));
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Add_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarBinaryOpZx(Context, () => Context.Emit(OpCodes.Add));
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Add_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-05-12 01:10:27 +02:00
|
|
|
if (AOptimizations.UseSse2)
|
|
|
|
{
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
EmitSse2Op(Context, nameof(Sse2.Add));
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpZx(Context, () => Context.Emit(OpCodes.Add));
|
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
2018-04-20 17:40:15 +02:00
|
|
|
public static void Addhn_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitHighNarrow(Context, () => Context.Emit(OpCodes.Add), Round: false);
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Addp_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
|
|
|
EmitVectorExtractZx(Context, Op.Rn, 0, Op.Size);
|
|
|
|
EmitVectorExtractZx(Context, Op.Rn, 1, Op.Size);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
EmitScalarSet(Context, Op.Rd, Op.Size);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Addp_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-07-03 08:31:48 +02:00
|
|
|
EmitVectorPairwiseOpZx(Context, () => Context.Emit(OpCodes.Add));
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Addv_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
2018-07-14 18:13:02 +02:00
|
|
|
int Bytes = Op.GetBitsCount() >> 3;
|
|
|
|
int Elems = Bytes >> Op.Size;
|
2018-02-17 22:06:11 +01:00
|
|
|
|
|
|
|
EmitVectorExtractZx(Context, Op.Rn, 0, Op.Size);
|
|
|
|
|
2018-07-14 18:13:02 +02:00
|
|
|
for (int Index = 1; Index < Elems; Index++)
|
2018-02-17 22:06:11 +01:00
|
|
|
{
|
|
|
|
EmitVectorExtractZx(Context, Op.Rn, Index, Op.Size);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
}
|
|
|
|
|
|
|
|
EmitScalarSet(Context, Op.Rd, Op.Size);
|
|
|
|
}
|
|
|
|
|
Add Cls_V, Clz_V, Orn_V instructions. Add 18 Tests: And_V, Bic_V, Bif_V, Bit_V, Bsl_V, Cls_V, Clz_V, Orn_V, Orr_V. (#104)
* Update AOpCodeTable.cs
* Update AInstEmitSimdLogical.cs
* Update AInstEmitSimdArithmetic.cs
* Update ASoftFallback.cs
* Update AInstEmitAlu.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
2018-04-26 04:20:22 +02:00
|
|
|
public static void Cls_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-14 04:35:16 +02:00
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
Add Cls_V, Clz_V, Orn_V instructions. Add 18 Tests: And_V, Bic_V, Bif_V, Bit_V, Bsl_V, Cls_V, Clz_V, Orn_V, Orr_V. (#104)
* Update AOpCodeTable.cs
* Update AInstEmitSimdLogical.cs
* Update AInstEmitSimdArithmetic.cs
* Update ASoftFallback.cs
* Update AInstEmitAlu.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
2018-04-26 04:20:22 +02:00
|
|
|
|
2018-10-14 04:35:16 +02:00
|
|
|
int Bytes = Op.GetBitsCount() >> 3;
|
|
|
|
int Elems = Bytes >> Op.Size;
|
Add Cls_V, Clz_V, Orn_V instructions. Add 18 Tests: And_V, Bic_V, Bif_V, Bit_V, Bsl_V, Cls_V, Clz_V, Orn_V, Orr_V. (#104)
* Update AOpCodeTable.cs
* Update AInstEmitSimdLogical.cs
* Update AInstEmitSimdArithmetic.cs
* Update ASoftFallback.cs
* Update AInstEmitAlu.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
2018-04-26 04:20:22 +02:00
|
|
|
|
2018-10-14 04:35:16 +02:00
|
|
|
int ESize = 8 << Op.Size;
|
|
|
|
|
|
|
|
for (int Index = 0; Index < Elems; Index++)
|
|
|
|
{
|
|
|
|
EmitVectorExtractZx(Context, Op.Rn, Index, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(ESize);
|
|
|
|
|
|
|
|
ASoftFallback.EmitCall(Context, nameof(ASoftFallback.CountLeadingSigns));
|
Add Cls_V, Clz_V, Orn_V instructions. Add 18 Tests: And_V, Bic_V, Bif_V, Bit_V, Bsl_V, Cls_V, Clz_V, Orn_V, Orr_V. (#104)
* Update AOpCodeTable.cs
* Update AInstEmitSimdLogical.cs
* Update AInstEmitSimdArithmetic.cs
* Update ASoftFallback.cs
* Update AInstEmitAlu.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
2018-04-26 04:20:22 +02:00
|
|
|
|
2018-10-14 04:35:16 +02:00
|
|
|
EmitVectorInsert(Context, Op.Rd, Index, Op.Size);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
Add Cls_V, Clz_V, Orn_V instructions. Add 18 Tests: And_V, Bic_V, Bif_V, Bit_V, Bsl_V, Cls_V, Clz_V, Orn_V, Orr_V. (#104)
* Update AOpCodeTable.cs
* Update AInstEmitSimdLogical.cs
* Update AInstEmitSimdArithmetic.cs
* Update ASoftFallback.cs
* Update AInstEmitAlu.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
2018-04-26 04:20:22 +02:00
|
|
|
}
|
|
|
|
|
2018-10-14 04:35:16 +02:00
|
|
|
public static void Clz_V(AILEmitterCtx Context)
|
Add Cls_V, Clz_V, Orn_V instructions. Add 18 Tests: And_V, Bic_V, Bif_V, Bit_V, Bsl_V, Cls_V, Clz_V, Orn_V, Orr_V. (#104)
* Update AOpCodeTable.cs
* Update AInstEmitSimdLogical.cs
* Update AInstEmitSimdArithmetic.cs
* Update ASoftFallback.cs
* Update AInstEmitAlu.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
2018-04-26 04:20:22 +02:00
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
2018-07-14 18:13:02 +02:00
|
|
|
int Bytes = Op.GetBitsCount() >> 3;
|
|
|
|
int Elems = Bytes >> Op.Size;
|
Add Cls_V, Clz_V, Orn_V instructions. Add 18 Tests: And_V, Bic_V, Bif_V, Bit_V, Bsl_V, Cls_V, Clz_V, Orn_V, Orr_V. (#104)
* Update AOpCodeTable.cs
* Update AInstEmitSimdLogical.cs
* Update AInstEmitSimdArithmetic.cs
* Update ASoftFallback.cs
* Update AInstEmitAlu.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
2018-04-26 04:20:22 +02:00
|
|
|
|
2018-07-14 20:07:44 +02:00
|
|
|
int ESize = 8 << Op.Size;
|
|
|
|
|
2018-07-14 18:13:02 +02:00
|
|
|
for (int Index = 0; Index < Elems; Index++)
|
Add Cls_V, Clz_V, Orn_V instructions. Add 18 Tests: And_V, Bic_V, Bif_V, Bit_V, Bsl_V, Cls_V, Clz_V, Orn_V, Orr_V. (#104)
* Update AOpCodeTable.cs
* Update AInstEmitSimdLogical.cs
* Update AInstEmitSimdArithmetic.cs
* Update ASoftFallback.cs
* Update AInstEmitAlu.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
2018-04-26 04:20:22 +02:00
|
|
|
{
|
|
|
|
EmitVectorExtractZx(Context, Op.Rn, Index, Op.Size);
|
|
|
|
|
2018-10-14 04:35:16 +02:00
|
|
|
if (Lzcnt.IsSupported && ESize == 32)
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Conv_U4);
|
Add Cls_V, Clz_V, Orn_V instructions. Add 18 Tests: And_V, Bic_V, Bif_V, Bit_V, Bsl_V, Cls_V, Clz_V, Orn_V, Orr_V. (#104)
* Update AOpCodeTable.cs
* Update AInstEmitSimdLogical.cs
* Update AInstEmitSimdArithmetic.cs
* Update ASoftFallback.cs
* Update AInstEmitAlu.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
2018-04-26 04:20:22 +02:00
|
|
|
|
2018-10-14 04:35:16 +02:00
|
|
|
Context.EmitCall(typeof(Lzcnt).GetMethod(nameof(Lzcnt.LeadingZeroCount), new Type[] { typeof(uint) }));
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Conv_U8);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
Context.EmitLdc_I4(ESize);
|
|
|
|
|
|
|
|
ASoftFallback.EmitCall(Context, nameof(ASoftFallback.CountLeadingZeros));
|
|
|
|
}
|
Add Cls_V, Clz_V, Orn_V instructions. Add 18 Tests: And_V, Bic_V, Bif_V, Bit_V, Bsl_V, Cls_V, Clz_V, Orn_V, Orr_V. (#104)
* Update AOpCodeTable.cs
* Update AInstEmitSimdLogical.cs
* Update AInstEmitSimdArithmetic.cs
* Update ASoftFallback.cs
* Update AInstEmitAlu.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
2018-04-26 04:20:22 +02:00
|
|
|
|
|
|
|
EmitVectorInsert(Context, Op.Rd, Index, Op.Size);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Cnt_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
|
|
|
int Elems = Op.RegisterSize == ARegisterSize.SIMD128 ? 16 : 8;
|
|
|
|
|
|
|
|
for (int Index = 0; Index < Elems; Index++)
|
|
|
|
{
|
|
|
|
EmitVectorExtractZx(Context, Op.Rn, Index, 0);
|
|
|
|
|
2018-10-14 04:35:16 +02:00
|
|
|
if (Popcnt.IsSupported)
|
|
|
|
{
|
|
|
|
Context.EmitCall(typeof(Popcnt).GetMethod(nameof(Popcnt.PopCount), new Type[] { typeof(ulong) }));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
ASoftFallback.EmitCall(Context, nameof(ASoftFallback.CountSetBits8));
|
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
|
|
|
|
EmitVectorInsert(Context, Op.Rd, Index, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-02-24 22:47:08 +01:00
|
|
|
public static void Fabd_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
|
|
|
|
EmitUnaryMathCall(Context, nameof(Math.Abs));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Fabs_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitUnaryMathCall(Context, nameof(Math.Abs));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-06-12 14:29:16 +02:00
|
|
|
public static void Fabs_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitUnaryMathCall(Context, nameof(Math.Abs));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Fadd_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-05-12 01:10:27 +02:00
|
|
|
{
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
EmitScalarSseOrSse2OpF(Context, nameof(Sse.AddScalar));
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPAdd));
|
|
|
|
});
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Fadd_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-05-12 01:10:27 +02:00
|
|
|
{
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
EmitVectorSseOrSse2OpF(Context, nameof(Sse.Add));
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitVectorBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPAdd));
|
|
|
|
});
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
2018-06-18 05:41:28 +02:00
|
|
|
public static void Faddp_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
|
|
|
int SizeF = Op.Size & 1;
|
|
|
|
|
|
|
|
EmitVectorExtractF(Context, Op.Rn, 0, SizeF);
|
|
|
|
EmitVectorExtractF(Context, Op.Rn, 1, SizeF);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
EmitScalarSetF(Context, Op.Rd, SizeF);
|
|
|
|
}
|
|
|
|
|
2018-04-05 03:13:10 +02:00
|
|
|
public static void Faddp_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-09-22 22:26:18 +02:00
|
|
|
EmitVectorPairwiseOpF(Context, () => Context.Emit(OpCodes.Add));
|
2018-04-05 03:13:10 +02:00
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Fdiv_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-05-12 01:10:27 +02:00
|
|
|
{
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
EmitScalarSseOrSse2OpF(Context, nameof(Sse.DivideScalar));
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPDiv));
|
|
|
|
});
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
2018-02-20 20:04:22 +01:00
|
|
|
public static void Fdiv_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-05-12 01:10:27 +02:00
|
|
|
{
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
EmitVectorSseOrSse2OpF(Context, nameof(Sse.Divide));
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitVectorBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPDiv));
|
|
|
|
});
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
2018-02-20 20:04:22 +01:00
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Fmadd_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse2)
|
2018-02-17 22:06:11 +01:00
|
|
|
{
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (Op.Size == 0)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesMulAdd = new Type[] { typeof(Vector128<float>), typeof(Vector128<float>) };
|
2018-10-06 03:45:59 +02:00
|
|
|
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
Context.EmitLdvec(Op.Ra);
|
|
|
|
Context.EmitLdvec(Op.Rn);
|
|
|
|
Context.EmitLdvec(Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.MultiplyScalar), TypesMulAdd));
|
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.AddScalar), TypesMulAdd));
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
|
|
|
|
Context.EmitStvec(Op.Rd);
|
|
|
|
|
|
|
|
EmitVectorZero32_128(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
else /* if (Op.Size == 1) */
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesMulAdd = new Type[] { typeof(Vector128<double>), typeof(Vector128<double>) };
|
2018-10-06 03:45:59 +02:00
|
|
|
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Ra);
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rn);
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.MultiplyScalar), TypesMulAdd));
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.AddScalar), TypesMulAdd));
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
|
|
|
|
EmitStvecWithCastFromDouble(Context, Op.Rd);
|
|
|
|
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitScalarTernaryRaOpF(Context, () =>
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMulAdd));
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
});
|
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Fmax_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-02-17 22:06:11 +01:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitScalarSseOrSse2OpF(Context, nameof(Sse.MaxScalar));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMax));
|
|
|
|
});
|
|
|
|
}
|
2018-04-19 05:22:12 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Fmax_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-08-05 07:54:21 +02:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitVectorSseOrSse2OpF(Context, nameof(Sse.Max));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMax));
|
|
|
|
});
|
|
|
|
}
|
2018-08-05 07:54:21 +02:00
|
|
|
}
|
2018-04-19 05:22:12 +02:00
|
|
|
|
2018-08-05 07:54:21 +02:00
|
|
|
public static void Fmaxnm_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMaxNum));
|
2018-08-05 07:54:21 +02:00
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Fmaxnm_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-04-19 05:22:12 +02:00
|
|
|
EmitVectorBinaryOpF(Context, () =>
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMaxNum));
|
2018-02-17 22:06:11 +01:00
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-09-22 22:26:18 +02:00
|
|
|
public static void Fmaxp_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitVectorPairwiseOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMax));
|
|
|
|
});
|
2018-09-22 22:26:18 +02:00
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Fmin_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-02-17 22:06:11 +01:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitScalarSseOrSse2OpF(Context, nameof(Sse.MinScalar));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMin));
|
|
|
|
});
|
|
|
|
}
|
2018-04-19 05:22:12 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Fmin_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-04-19 05:22:12 +02:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitVectorSseOrSse2OpF(Context, nameof(Sse.Min));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMin));
|
|
|
|
});
|
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
2018-08-05 07:54:21 +02:00
|
|
|
public static void Fminnm_S(AILEmitterCtx Context)
|
2018-02-17 22:06:11 +01:00
|
|
|
{
|
2018-08-05 07:54:21 +02:00
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMinNum));
|
2018-08-05 07:54:21 +02:00
|
|
|
});
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
2018-08-05 07:54:21 +02:00
|
|
|
public static void Fminnm_V(AILEmitterCtx Context)
|
2018-02-17 22:06:11 +01:00
|
|
|
{
|
2018-08-05 07:54:21 +02:00
|
|
|
EmitVectorBinaryOpF(Context, () =>
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMinNum));
|
2018-08-05 07:54:21 +02:00
|
|
|
});
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
2018-09-22 22:26:18 +02:00
|
|
|
public static void Fminp_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitVectorPairwiseOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMin));
|
|
|
|
});
|
2018-09-22 22:26:18 +02:00
|
|
|
}
|
|
|
|
|
2018-06-29 01:51:38 +02:00
|
|
|
public static void Fmla_Se(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarTernaryOpByElemF(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Fmla_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorTernaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Fmla_Ve(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorTernaryOpByElemF(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-10-14 04:35:16 +02:00
|
|
|
public static void Fmls_Se(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarTernaryOpByElemF(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-04-06 06:41:54 +02:00
|
|
|
public static void Fmls_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorTernaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Fmls_Ve(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorTernaryOpByElemF(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Fmsub_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse2)
|
2018-02-17 22:06:11 +01:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (Op.Size == 0)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesMulSub = new Type[] { typeof(Vector128<float>), typeof(Vector128<float>) };
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdvec(Op.Ra);
|
|
|
|
Context.EmitLdvec(Op.Rn);
|
|
|
|
Context.EmitLdvec(Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.MultiplyScalar), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.SubtractScalar), TypesMulSub));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitStvec(Op.Rd);
|
|
|
|
|
|
|
|
EmitVectorZero32_128(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
else /* if (Op.Size == 1) */
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesMulSub = new Type[] { typeof(Vector128<double>), typeof(Vector128<double>) };
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Ra);
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rn);
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.MultiplyScalar), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SubtractScalar), TypesMulSub));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
EmitStvecWithCastFromDouble(Context, Op.Rd);
|
|
|
|
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitScalarTernaryRaOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMulSub));
|
|
|
|
});
|
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Fmul_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-05-12 01:10:27 +02:00
|
|
|
{
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
EmitScalarSseOrSse2OpF(Context, nameof(Sse.MultiplyScalar));
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMul));
|
|
|
|
});
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
2018-04-08 21:08:57 +02:00
|
|
|
public static void Fmul_Se(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarBinaryOpByElemF(Context, () => Context.Emit(OpCodes.Mul));
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Fmul_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-05-12 01:10:27 +02:00
|
|
|
{
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
EmitVectorSseOrSse2OpF(Context, nameof(Sse.Multiply));
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitVectorBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMul));
|
|
|
|
});
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Fmul_Ve(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpByElemF(Context, () => Context.Emit(OpCodes.Mul));
|
|
|
|
}
|
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
public static void Fmulx_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMulX));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-10-14 04:35:16 +02:00
|
|
|
public static void Fmulx_Se(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarBinaryOpByElemF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMulX));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
public static void Fmulx_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMulX));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-10-14 04:35:16 +02:00
|
|
|
public static void Fmulx_Ve(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpByElemF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPMulX));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Fneg_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarUnaryOpF(Context, () => Context.Emit(OpCodes.Neg));
|
|
|
|
}
|
|
|
|
|
2018-04-04 21:36:07 +02:00
|
|
|
public static void Fneg_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorUnaryOpF(Context, () => Context.Emit(OpCodes.Neg));
|
|
|
|
}
|
|
|
|
|
2018-03-24 04:23:42 +01:00
|
|
|
public static void Fnmadd_S(AILEmitterCtx Context)
|
2018-02-17 22:06:11 +01:00
|
|
|
{
|
2018-03-24 04:23:42 +01:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
int SizeF = Op.Size & 1;
|
|
|
|
|
|
|
|
EmitVectorExtractF(Context, Op.Rn, 0, SizeF);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Neg);
|
|
|
|
|
|
|
|
EmitVectorExtractF(Context, Op.Rm, 0, SizeF);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
|
|
|
|
EmitVectorExtractF(Context, Op.Ra, 0, SizeF);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
|
|
|
|
EmitScalarSetF(Context, Op.Rd, SizeF);
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
2018-02-20 18:39:03 +01:00
|
|
|
public static void Fnmsub_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
int SizeF = Op.Size & 1;
|
2018-03-30 17:37:07 +02:00
|
|
|
|
2018-02-20 18:39:03 +01:00
|
|
|
EmitVectorExtractF(Context, Op.Rn, 0, SizeF);
|
|
|
|
EmitVectorExtractF(Context, Op.Rm, 0, SizeF);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
|
|
|
|
EmitVectorExtractF(Context, Op.Ra, 0, SizeF);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
|
|
|
|
EmitScalarSetF(Context, Op.Rd, SizeF);
|
|
|
|
}
|
|
|
|
|
2018-03-24 04:23:42 +01:00
|
|
|
public static void Fnmul_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Neg);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-04-08 21:08:57 +02:00
|
|
|
public static void Frecpe_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-07-08 21:54:47 +02:00
|
|
|
EmitScalarUnaryOpF(Context, () =>
|
2018-04-08 21:08:57 +02:00
|
|
|
{
|
2018-07-08 21:54:47 +02:00
|
|
|
EmitUnarySoftFloatCall(Context, nameof(ASoftFloat.RecipEstimate));
|
|
|
|
});
|
2018-04-08 21:08:57 +02:00
|
|
|
}
|
|
|
|
|
2018-07-08 21:54:47 +02:00
|
|
|
public static void Frecpe_V(AILEmitterCtx Context)
|
2018-04-08 21:08:57 +02:00
|
|
|
{
|
2018-07-08 21:54:47 +02:00
|
|
|
EmitVectorUnaryOpF(Context, () =>
|
2018-04-08 21:08:57 +02:00
|
|
|
{
|
2018-07-08 21:54:47 +02:00
|
|
|
EmitUnarySoftFloatCall(Context, nameof(ASoftFloat.RecipEstimate));
|
|
|
|
});
|
2018-04-08 21:08:57 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Frecps_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse2)
|
2018-04-08 21:08:57 +02:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
int SizeF = Op.Size & 1;
|
|
|
|
|
|
|
|
if (SizeF == 0)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSsv = new Type[] { typeof(float) };
|
|
|
|
Type[] TypesMulSub = new Type[] { typeof(Vector128<float>), typeof(Vector128<float>) };
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdc_R4(2f);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.SetScalarVector128), TypesSsv));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdvec(Op.Rn);
|
|
|
|
Context.EmitLdvec(Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.MultiplyScalar), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.SubtractScalar), TypesMulSub));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitStvec(Op.Rd);
|
|
|
|
|
|
|
|
EmitVectorZero32_128(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
else /* if (SizeF == 1) */
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSsv = new Type[] { typeof(double) };
|
|
|
|
Type[] TypesMulSub = new Type[] { typeof(Vector128<double>), typeof(Vector128<double>) };
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdc_R8(2d);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetScalarVector128), TypesSsv));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rn);
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.MultiplyScalar), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SubtractScalar), TypesMulSub));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
EmitStvecWithCastFromDouble(Context, Op.Rd);
|
|
|
|
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPRecipStepFused));
|
|
|
|
});
|
|
|
|
}
|
2018-04-08 21:08:57 +02:00
|
|
|
}
|
|
|
|
|
2018-07-08 21:54:47 +02:00
|
|
|
public static void Frecps_V(AILEmitterCtx Context)
|
2018-04-08 21:08:57 +02:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse2)
|
2018-04-08 21:08:57 +02:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
int SizeF = Op.Size & 1;
|
|
|
|
|
|
|
|
if (SizeF == 0)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSav = new Type[] { typeof(float) };
|
|
|
|
Type[] TypesMulSub = new Type[] { typeof(Vector128<float>), typeof(Vector128<float>) };
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdc_R4(2f);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.SetAllVector128), TypesSav));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdvec(Op.Rn);
|
|
|
|
Context.EmitLdvec(Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.Multiply), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.Subtract), TypesMulSub));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitStvec(Op.Rd);
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else /* if (SizeF == 1) */
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSav = new Type[] { typeof(double) };
|
|
|
|
Type[] TypesMulSub = new Type[] { typeof(Vector128<double>), typeof(Vector128<double>) };
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdc_R8(2d);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetAllVector128), TypesSav));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rn);
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Multiply), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Subtract), TypesMulSub));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
EmitStvecWithCastFromDouble(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPRecipStepFused));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Frecpx_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPRecpX));
|
2018-07-08 21:54:47 +02:00
|
|
|
});
|
2018-04-08 21:08:57 +02:00
|
|
|
}
|
|
|
|
|
2018-03-24 04:23:42 +01:00
|
|
|
public static void Frinta_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
|
|
|
EmitVectorExtractF(Context, Op.Rn, 0, Op.Size);
|
|
|
|
|
|
|
|
EmitRoundMathCall(Context, MidpointRounding.AwayFromZero);
|
|
|
|
|
|
|
|
EmitScalarSetF(Context, Op.Rd, Op.Size);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Frinta_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitRoundMathCall(Context, MidpointRounding.AwayFromZero);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-03-23 11:40:23 +01:00
|
|
|
public static void Frinti_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
|
|
|
EmitScalarUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
Context.EmitLdarg(ATranslatedSub.StateArgIdx);
|
|
|
|
|
|
|
|
if (Op.Size == 0)
|
|
|
|
{
|
2018-05-12 01:10:27 +02:00
|
|
|
AVectorHelper.EmitCall(Context, nameof(AVectorHelper.RoundF));
|
2018-03-23 11:40:23 +01:00
|
|
|
}
|
|
|
|
else if (Op.Size == 1)
|
|
|
|
{
|
2018-05-12 01:10:27 +02:00
|
|
|
AVectorHelper.EmitCall(Context, nameof(AVectorHelper.Round));
|
2018-03-23 11:40:23 +01:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
throw new InvalidOperationException();
|
|
|
|
}
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Frinti_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
2018-03-30 17:37:07 +02:00
|
|
|
|
2018-04-19 05:22:12 +02:00
|
|
|
int SizeF = Op.Size & 1;
|
|
|
|
|
2018-03-23 11:40:23 +01:00
|
|
|
EmitVectorUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
Context.EmitLdarg(ATranslatedSub.StateArgIdx);
|
|
|
|
|
2018-04-19 05:22:12 +02:00
|
|
|
if (SizeF == 0)
|
2018-03-30 17:37:07 +02:00
|
|
|
{
|
2018-05-12 01:10:27 +02:00
|
|
|
AVectorHelper.EmitCall(Context, nameof(AVectorHelper.RoundF));
|
2018-03-23 11:40:23 +01:00
|
|
|
}
|
2018-04-19 05:22:12 +02:00
|
|
|
else if (SizeF == 1)
|
2018-03-30 17:37:07 +02:00
|
|
|
{
|
2018-05-12 01:10:27 +02:00
|
|
|
AVectorHelper.EmitCall(Context, nameof(AVectorHelper.Round));
|
2018-03-23 11:40:23 +01:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
throw new InvalidOperationException();
|
|
|
|
}
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Frintm_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitUnaryMathCall(Context, nameof(Math.Floor));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-03-10 03:41:05 +01:00
|
|
|
public static void Frintm_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitUnaryMathCall(Context, nameof(Math.Floor));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-03-23 11:40:23 +01:00
|
|
|
public static void Frintn_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
|
|
|
EmitVectorExtractF(Context, Op.Rn, 0, Op.Size);
|
|
|
|
|
|
|
|
EmitRoundMathCall(Context, MidpointRounding.ToEven);
|
|
|
|
|
|
|
|
EmitScalarSetF(Context, Op.Rd, Op.Size);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Frintn_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitRoundMathCall(Context, MidpointRounding.ToEven);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-02-22 20:26:11 +01:00
|
|
|
public static void Frintp_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitUnaryMathCall(Context, nameof(Math.Ceiling));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-03-23 11:40:23 +01:00
|
|
|
public static void Frintp_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitUnaryMathCall(Context, nameof(Math.Ceiling));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-02-24 15:19:28 +01:00
|
|
|
public static void Frintx_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
2018-02-24 22:47:08 +01:00
|
|
|
EmitScalarUnaryOpF(Context, () =>
|
2018-02-24 15:19:28 +01:00
|
|
|
{
|
2018-02-24 22:47:08 +01:00
|
|
|
Context.EmitLdarg(ATranslatedSub.StateArgIdx);
|
|
|
|
|
|
|
|
if (Op.Size == 0)
|
|
|
|
{
|
2018-05-12 01:10:27 +02:00
|
|
|
AVectorHelper.EmitCall(Context, nameof(AVectorHelper.RoundF));
|
2018-02-24 22:47:08 +01:00
|
|
|
}
|
|
|
|
else if (Op.Size == 1)
|
|
|
|
{
|
2018-05-12 01:10:27 +02:00
|
|
|
AVectorHelper.EmitCall(Context, nameof(AVectorHelper.Round));
|
2018-02-24 22:47:08 +01:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
throw new InvalidOperationException();
|
|
|
|
}
|
|
|
|
});
|
2018-02-24 15:19:28 +01:00
|
|
|
}
|
2018-03-23 11:40:23 +01:00
|
|
|
|
|
|
|
public static void Frintx_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
|
|
|
EmitVectorUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
Context.EmitLdarg(ATranslatedSub.StateArgIdx);
|
|
|
|
|
|
|
|
if (Op.Size == 0)
|
2018-03-30 17:37:07 +02:00
|
|
|
{
|
2018-05-12 01:10:27 +02:00
|
|
|
AVectorHelper.EmitCall(Context, nameof(AVectorHelper.RoundF));
|
2018-03-23 11:40:23 +01:00
|
|
|
}
|
|
|
|
else if (Op.Size == 1)
|
2018-03-30 17:37:07 +02:00
|
|
|
{
|
2018-05-12 01:10:27 +02:00
|
|
|
AVectorHelper.EmitCall(Context, nameof(AVectorHelper.Round));
|
2018-03-23 11:40:23 +01:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
throw new InvalidOperationException();
|
|
|
|
}
|
|
|
|
});
|
2018-04-06 01:36:19 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Frsqrte_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitUnarySoftFloatCall(Context, nameof(ASoftFloat.InvSqrtEstimate));
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Frsqrte_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitUnarySoftFloatCall(Context, nameof(ASoftFloat.InvSqrtEstimate));
|
|
|
|
});
|
2018-03-23 11:40:23 +01:00
|
|
|
}
|
2018-02-24 15:19:28 +01:00
|
|
|
|
2018-04-06 04:28:12 +02:00
|
|
|
public static void Frsqrts_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse2)
|
|
|
|
{
|
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
2018-04-06 04:28:12 +02:00
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
int SizeF = Op.Size & 1;
|
2018-04-06 15:20:17 +02:00
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
if (SizeF == 0)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSsv = new Type[] { typeof(float) };
|
|
|
|
Type[] TypesMulSub = new Type[] { typeof(Vector128<float>), typeof(Vector128<float>) };
|
2018-04-06 15:20:17 +02:00
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
Context.EmitLdc_R4(0.5f);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.SetScalarVector128), TypesSsv));
|
2018-04-06 15:20:17 +02:00
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
Context.EmitLdc_R4(3f);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.SetScalarVector128), TypesSsv));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdvec(Op.Rn);
|
|
|
|
Context.EmitLdvec(Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.MultiplyScalar), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.SubtractScalar), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.MultiplyScalar), TypesMulSub));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitStvec(Op.Rd);
|
|
|
|
|
|
|
|
EmitVectorZero32_128(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
else /* if (SizeF == 1) */
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSsv = new Type[] { typeof(double) };
|
|
|
|
Type[] TypesMulSub = new Type[] { typeof(Vector128<double>), typeof(Vector128<double>) };
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdc_R8(0.5d);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetScalarVector128), TypesSsv));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdc_R8(3d);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetScalarVector128), TypesSsv));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rn);
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.MultiplyScalar), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SubtractScalar), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.MultiplyScalar), TypesMulSub));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
EmitStvecWithCastFromDouble(Context, Op.Rd);
|
|
|
|
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
2018-04-06 15:20:17 +02:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPRSqrtStepFused));
|
|
|
|
});
|
2018-04-06 15:20:17 +02:00
|
|
|
}
|
2018-04-06 04:28:12 +02:00
|
|
|
}
|
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
public static void Frsqrts_V(AILEmitterCtx Context)
|
2018-04-06 04:28:12 +02:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse2)
|
|
|
|
{
|
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
2018-04-06 04:28:12 +02:00
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
int SizeF = Op.Size & 1;
|
2018-04-06 04:28:12 +02:00
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
if (SizeF == 0)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSav = new Type[] { typeof(float) };
|
|
|
|
Type[] TypesMulSub = new Type[] { typeof(Vector128<float>), typeof(Vector128<float>) };
|
2018-04-06 04:28:12 +02:00
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
Context.EmitLdc_R4(0.5f);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.SetAllVector128), TypesSav));
|
2018-04-06 15:20:17 +02:00
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
Context.EmitLdc_R4(3f);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.SetAllVector128), TypesSav));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdvec(Op.Rn);
|
|
|
|
Context.EmitLdvec(Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.Multiply), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.Subtract), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse).GetMethod(nameof(Sse.Multiply), TypesMulSub));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitStvec(Op.Rd);
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else /* if (SizeF == 1) */
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSav = new Type[] { typeof(double) };
|
|
|
|
Type[] TypesMulSub = new Type[] { typeof(Vector128<double>), typeof(Vector128<double>) };
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdc_R8(0.5d);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetAllVector128), TypesSav));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
Context.EmitLdc_R8(3d);
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetAllVector128), TypesSav));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rn);
|
|
|
|
EmitLdvecWithCastToDouble(Context, Op.Rm);
|
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Multiply), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Subtract), TypesMulSub));
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Multiply), TypesMulSub));
|
2018-10-06 03:45:59 +02:00
|
|
|
|
|
|
|
EmitStvecWithCastFromDouble(Context, Op.Rd);
|
|
|
|
}
|
2018-04-06 04:28:12 +02:00
|
|
|
}
|
2018-10-06 03:45:59 +02:00
|
|
|
else
|
2018-04-06 04:28:12 +02:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitVectorBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPRSqrtStepFused));
|
|
|
|
});
|
2018-04-06 04:28:12 +02:00
|
|
|
}
|
2018-10-06 03:45:59 +02:00
|
|
|
}
|
2018-04-06 04:28:12 +02:00
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
public static void Fsqrt_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-04-06 15:20:17 +02:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitScalarSseOrSse2OpF(Context, nameof(Sse.SqrtScalar));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitScalarUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPSqrt));
|
|
|
|
});
|
2018-04-06 15:20:17 +02:00
|
|
|
}
|
2018-04-06 04:28:12 +02:00
|
|
|
}
|
|
|
|
|
2018-10-06 03:45:59 +02:00
|
|
|
public static void Fsqrt_V(AILEmitterCtx Context)
|
2018-02-17 22:06:11 +01:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-02-17 22:06:11 +01:00
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitVectorSseOrSse2OpF(Context, nameof(Sse.Sqrt));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorUnaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPSqrt));
|
|
|
|
});
|
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Fsub_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-05-12 01:10:27 +02:00
|
|
|
{
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
EmitScalarSseOrSse2OpF(Context, nameof(Sse.SubtractScalar));
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitScalarBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPSub));
|
|
|
|
});
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Fsub_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
if (AOptimizations.FastFP && AOptimizations.UseSse
|
|
|
|
&& AOptimizations.UseSse2)
|
2018-05-12 01:10:27 +02:00
|
|
|
{
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
EmitVectorSseOrSse2OpF(Context, nameof(Sse.Subtract));
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
2018-10-06 03:45:59 +02:00
|
|
|
EmitVectorBinaryOpF(Context, () =>
|
|
|
|
{
|
|
|
|
EmitSoftFloatCall(Context, nameof(ASoftFloat_32.FPSub));
|
|
|
|
});
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Mla_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorTernaryOpZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-03-16 02:36:47 +01:00
|
|
|
public static void Mla_Ve(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorTernaryOpByElemZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-02-18 06:13:42 +01:00
|
|
|
public static void Mls_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorTernaryOpZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-09-08 19:24:29 +02:00
|
|
|
public static void Mls_Ve(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorTernaryOpByElemZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Mul_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpZx(Context, () => Context.Emit(OpCodes.Mul));
|
|
|
|
}
|
|
|
|
|
2018-03-05 20:18:37 +01:00
|
|
|
public static void Mul_Ve(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpByElemZx(Context, () => Context.Emit(OpCodes.Mul));
|
|
|
|
}
|
|
|
|
|
2018-04-18 15:56:27 +02:00
|
|
|
public static void Neg_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarUnaryOpSx(Context, () => Context.Emit(OpCodes.Neg));
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Neg_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorUnaryOpSx(Context, () => Context.Emit(OpCodes.Neg));
|
|
|
|
}
|
|
|
|
|
2018-04-20 17:40:15 +02:00
|
|
|
public static void Raddhn_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitHighNarrow(Context, () => Context.Emit(OpCodes.Add), Round: true);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Rsubhn_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitHighNarrow(Context, () => Context.Emit(OpCodes.Sub), Round: true);
|
|
|
|
}
|
|
|
|
|
2018-06-30 17:40:41 +02:00
|
|
|
public static void Saba_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorTernaryOpSx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
EmitAbs(Context);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sabal_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmTernaryOpSx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
EmitAbs(Context);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sabd_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpSx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
EmitAbs(Context);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sabdl_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmBinaryOpSx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
EmitAbs(Context);
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-08-13 23:10:02 +02:00
|
|
|
public static void Sadalp_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitAddLongPairwise(Context, Signed: true, Accumulate: true);
|
|
|
|
}
|
|
|
|
|
Add Fcvtns_S, Fcvtns_V, Fcvtnu_S, Fcvtnu_V (AOpCodeSimd) FP & Umlal_V, Umlsl_V, Saddl_V, Ssubl_V, Usubl_V instructions; add 8 FP & 16 S/Umlal_V, S/Umlsl_V, S/Uaddl_V, S/Usubl_V Tests. (#390)
* Update AOpCodeTable.cs
* Update AInstEmitSimdCvt.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Add QCFlagBit.
* Add QCFlagBit.
2018-09-01 16:52:51 +02:00
|
|
|
public static void Saddl_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
if (AOptimizations.UseSse41)
|
|
|
|
{
|
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
Type[] TypesSrl = new Type[] { VectorIntTypesPerSizeLog2[Op.Size], typeof(byte) };
|
|
|
|
Type[] TypesCvt = new Type[] { VectorIntTypesPerSizeLog2[Op.Size] };
|
|
|
|
Type[] TypesAdd = new Type[] { VectorIntTypesPerSizeLog2[Op.Size + 1],
|
|
|
|
VectorIntTypesPerSizeLog2[Op.Size + 1] };
|
|
|
|
|
|
|
|
string[] NamesCvt = new string[] { nameof(Sse41.ConvertToVector128Int16),
|
|
|
|
nameof(Sse41.ConvertToVector128Int32),
|
|
|
|
nameof(Sse41.ConvertToVector128Int64) };
|
|
|
|
|
|
|
|
int NumBytes = Op.RegisterSize == ARegisterSize.SIMD128 ? 8 : 0;
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NamesCvt[Op.Size], TypesCvt));
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NamesCvt[Op.Size], TypesCvt));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Add), TypesAdd));
|
|
|
|
|
|
|
|
EmitStvecWithSignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmBinaryOpSx(Context, () => Context.Emit(OpCodes.Add));
|
|
|
|
}
|
Add Fcvtns_S, Fcvtns_V, Fcvtnu_S, Fcvtnu_V (AOpCodeSimd) FP & Umlal_V, Umlsl_V, Saddl_V, Ssubl_V, Usubl_V instructions; add 8 FP & 16 S/Umlal_V, S/Umlsl_V, S/Uaddl_V, S/Usubl_V Tests. (#390)
* Update AOpCodeTable.cs
* Update AInstEmitSimdCvt.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Add QCFlagBit.
* Add QCFlagBit.
2018-09-01 16:52:51 +02:00
|
|
|
}
|
|
|
|
|
2018-08-13 23:10:02 +02:00
|
|
|
public static void Saddlp_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitAddLongPairwise(Context, Signed: true, Accumulate: false);
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Saddw_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-02-20 18:39:03 +01:00
|
|
|
EmitVectorWidenRmBinaryOpSx(Context, () => Context.Emit(OpCodes.Add));
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
public static void Shadd_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (AOptimizations.UseSse2 && Op.Size > 0)
|
2018-08-27 08:44:01 +02:00
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSra = new Type[] { VectorIntTypesPerSizeLog2[Op.Size], typeof(byte) };
|
|
|
|
Type[] TypesAndXorAdd = new Type[] { VectorIntTypesPerSizeLog2[Op.Size], VectorIntTypesPerSizeLog2[Op.Size] };
|
2018-08-27 08:44:01 +02:00
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Dup);
|
|
|
|
Context.EmitStvectmp();
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Dup);
|
|
|
|
Context.EmitStvectmp2();
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.And), TypesAndXorAdd));
|
|
|
|
|
|
|
|
Context.EmitLdvectmp();
|
|
|
|
Context.EmitLdvectmp2();
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Xor), TypesAndXorAdd));
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(1);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightArithmetic), TypesSra));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Add), TypesAndXorAdd));
|
|
|
|
|
|
|
|
EmitStvecWithSignedCast(Context, Op.Rd, Op.Size);
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpSx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Ldc_I4_1);
|
|
|
|
Context.Emit(OpCodes.Shr);
|
|
|
|
});
|
|
|
|
}
|
2018-08-27 08:44:01 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Shsub_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (AOptimizations.UseSse2 && Op.Size < 2)
|
2018-08-27 08:44:01 +02:00
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSav = new Type[] { IntTypesPerSizeLog2[Op.Size] };
|
|
|
|
Type[] TypesAddSub = new Type[] { VectorIntTypesPerSizeLog2 [Op.Size], VectorIntTypesPerSizeLog2 [Op.Size] };
|
|
|
|
Type[] TypesAvg = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size], VectorUIntTypesPerSizeLog2[Op.Size] };
|
2018-08-27 08:44:01 +02:00
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitLdc_I4(Op.Size == 0 ? sbyte.MinValue : short.MinValue);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetAllVector128), TypesSav));
|
|
|
|
|
|
|
|
Context.EmitStvectmp();
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
Context.EmitLdvectmp();
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Add), TypesAddSub));
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Dup);
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
Context.EmitLdvectmp();
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Add), TypesAddSub));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Average), TypesAvg));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Subtract), TypesAddSub));
|
|
|
|
|
|
|
|
EmitStvecWithSignedCast(Context, Op.Rd, Op.Size);
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpSx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Ldc_I4_1);
|
|
|
|
Context.Emit(OpCodes.Shr);
|
|
|
|
});
|
|
|
|
}
|
2018-08-27 08:44:01 +02:00
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Smax_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
Type[] Types = new Type[] { typeof(long), typeof(long) };
|
|
|
|
|
|
|
|
MethodInfo MthdInfo = typeof(Math).GetMethod(nameof(Math.Max), Types);
|
|
|
|
|
|
|
|
EmitVectorBinaryOpSx(Context, () => Context.EmitCall(MthdInfo));
|
|
|
|
}
|
|
|
|
|
2018-07-03 08:31:48 +02:00
|
|
|
public static void Smaxp_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
Type[] Types = new Type[] { typeof(long), typeof(long) };
|
|
|
|
|
|
|
|
MethodInfo MthdInfo = typeof(Math).GetMethod(nameof(Math.Max), Types);
|
|
|
|
|
|
|
|
EmitVectorPairwiseOpSx(Context, () => Context.EmitCall(MthdInfo));
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Smin_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
Type[] Types = new Type[] { typeof(long), typeof(long) };
|
|
|
|
|
|
|
|
MethodInfo MthdInfo = typeof(Math).GetMethod(nameof(Math.Min), Types);
|
|
|
|
|
|
|
|
EmitVectorBinaryOpSx(Context, () => Context.EmitCall(MthdInfo));
|
|
|
|
}
|
|
|
|
|
2018-07-03 08:31:48 +02:00
|
|
|
public static void Sminp_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
Type[] Types = new Type[] { typeof(long), typeof(long) };
|
|
|
|
|
|
|
|
MethodInfo MthdInfo = typeof(Math).GetMethod(nameof(Math.Min), Types);
|
|
|
|
|
|
|
|
EmitVectorPairwiseOpSx(Context, () => Context.EmitCall(MthdInfo));
|
|
|
|
}
|
|
|
|
|
2018-03-07 01:36:49 +01:00
|
|
|
public static void Smlal_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (AOptimizations.UseSse41 && Op.Size < 2)
|
2018-03-07 01:36:49 +01:00
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSrl = new Type[] { VectorIntTypesPerSizeLog2[Op.Size], typeof(byte) };
|
|
|
|
Type[] TypesCvt = new Type[] { VectorIntTypesPerSizeLog2[Op.Size] };
|
|
|
|
Type[] TypesMulAdd = new Type[] { VectorIntTypesPerSizeLog2[Op.Size + 1],
|
|
|
|
VectorIntTypesPerSizeLog2[Op.Size + 1] };
|
|
|
|
|
|
|
|
Type TypeMul = Op.Size == 0 ? typeof(Sse2) : typeof(Sse41);
|
|
|
|
|
|
|
|
string NameCvt = Op.Size == 0
|
|
|
|
? nameof(Sse41.ConvertToVector128Int16)
|
|
|
|
: nameof(Sse41.ConvertToVector128Int32);
|
|
|
|
|
|
|
|
int NumBytes = Op.RegisterSize == ARegisterSize.SIMD128 ? 8 : 0;
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NameCvt, TypesCvt));
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NameCvt, TypesCvt));
|
|
|
|
|
|
|
|
Context.EmitCall(TypeMul.GetMethod(nameof(Sse2.MultiplyLow), TypesMulAdd));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Add), TypesMulAdd));
|
|
|
|
|
|
|
|
EmitStvecWithSignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmTernaryOpSx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
});
|
|
|
|
}
|
2018-03-07 01:36:49 +01:00
|
|
|
}
|
|
|
|
|
2018-07-14 18:13:02 +02:00
|
|
|
public static void Smlsl_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (AOptimizations.UseSse41 && Op.Size < 2)
|
2018-07-14 18:13:02 +02:00
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSrl = new Type[] { VectorIntTypesPerSizeLog2[Op.Size], typeof(byte) };
|
|
|
|
Type[] TypesCvt = new Type[] { VectorIntTypesPerSizeLog2[Op.Size] };
|
|
|
|
Type[] TypesMulSub = new Type[] { VectorIntTypesPerSizeLog2[Op.Size + 1],
|
|
|
|
VectorIntTypesPerSizeLog2[Op.Size + 1] };
|
|
|
|
|
|
|
|
Type TypeMul = Op.Size == 0 ? typeof(Sse2) : typeof(Sse41);
|
|
|
|
|
|
|
|
string NameCvt = Op.Size == 0
|
|
|
|
? nameof(Sse41.ConvertToVector128Int16)
|
|
|
|
: nameof(Sse41.ConvertToVector128Int32);
|
|
|
|
|
|
|
|
int NumBytes = Op.RegisterSize == ARegisterSize.SIMD128 ? 8 : 0;
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NameCvt, TypesCvt));
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NameCvt, TypesCvt));
|
|
|
|
|
|
|
|
Context.EmitCall(TypeMul.GetMethod(nameof(Sse2.MultiplyLow), TypesMulSub));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Subtract), TypesMulSub));
|
|
|
|
|
|
|
|
EmitStvecWithSignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmTernaryOpSx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
});
|
|
|
|
}
|
2018-07-14 18:13:02 +02:00
|
|
|
}
|
|
|
|
|
2018-02-20 18:39:03 +01:00
|
|
|
public static void Smull_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmBinaryOpSx(Context, () => Context.Emit(OpCodes.Mul));
|
|
|
|
}
|
|
|
|
|
2018-08-04 21:58:54 +02:00
|
|
|
public static void Sqabs_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarSaturatingUnaryOpSx(Context, () => EmitAbs(Context));
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sqabs_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorSaturatingUnaryOpSx(Context, () => EmitAbs(Context));
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sqadd_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarSaturatingBinaryOpSx(Context, SaturatingFlags.Add);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sqadd_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorSaturatingBinaryOpSx(Context, SaturatingFlags.Add);
|
|
|
|
}
|
|
|
|
|
2018-08-10 19:27:15 +02:00
|
|
|
public static void Sqdmulh_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitSaturatingBinaryOp(Context, () => EmitDoublingMultiplyHighHalf(Context, Round: false), SaturatingFlags.ScalarSx);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sqdmulh_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitSaturatingBinaryOp(Context, () => EmitDoublingMultiplyHighHalf(Context, Round: false), SaturatingFlags.VectorSx);
|
|
|
|
}
|
|
|
|
|
2018-08-04 21:58:54 +02:00
|
|
|
public static void Sqneg_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarSaturatingUnaryOpSx(Context, () => Context.Emit(OpCodes.Neg));
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sqneg_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorSaturatingUnaryOpSx(Context, () => Context.Emit(OpCodes.Neg));
|
|
|
|
}
|
|
|
|
|
2018-08-10 19:27:15 +02:00
|
|
|
public static void Sqrdmulh_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitSaturatingBinaryOp(Context, () => EmitDoublingMultiplyHighHalf(Context, Round: true), SaturatingFlags.ScalarSx);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sqrdmulh_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitSaturatingBinaryOp(Context, () => EmitDoublingMultiplyHighHalf(Context, Round: true), SaturatingFlags.VectorSx);
|
|
|
|
}
|
|
|
|
|
2018-08-04 21:58:54 +02:00
|
|
|
public static void Sqsub_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarSaturatingBinaryOpSx(Context, SaturatingFlags.Sub);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sqsub_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorSaturatingBinaryOpSx(Context, SaturatingFlags.Sub);
|
|
|
|
}
|
|
|
|
|
2018-04-30 01:39:58 +02:00
|
|
|
public static void Sqxtn_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-09-17 06:54:05 +02:00
|
|
|
EmitSaturatingNarrowOp(Context, SaturatingNarrowFlags.ScalarSxSx);
|
2018-04-30 01:39:58 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sqxtn_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-09-17 06:54:05 +02:00
|
|
|
EmitSaturatingNarrowOp(Context, SaturatingNarrowFlags.VectorSxSx);
|
2018-04-30 01:39:58 +02:00
|
|
|
}
|
|
|
|
|
2018-06-25 19:23:46 +02:00
|
|
|
public static void Sqxtun_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-09-17 06:54:05 +02:00
|
|
|
EmitSaturatingNarrowOp(Context, SaturatingNarrowFlags.ScalarSxZx);
|
2018-06-25 19:23:46 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sqxtun_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-09-17 06:54:05 +02:00
|
|
|
EmitSaturatingNarrowOp(Context, SaturatingNarrowFlags.VectorSxZx);
|
2018-06-25 19:23:46 +02:00
|
|
|
}
|
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
public static void Srhadd_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (AOptimizations.UseSse2 && Op.Size < 2)
|
2018-08-27 08:44:01 +02:00
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSav = new Type[] { IntTypesPerSizeLog2[Op.Size] };
|
|
|
|
Type[] TypesSubAdd = new Type[] { VectorIntTypesPerSizeLog2 [Op.Size], VectorIntTypesPerSizeLog2 [Op.Size] };
|
|
|
|
Type[] TypesAvg = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size], VectorUIntTypesPerSizeLog2[Op.Size] };
|
2018-08-27 08:44:01 +02:00
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitLdc_I4(Op.Size == 0 ? sbyte.MinValue : short.MinValue);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.SetAllVector128), TypesSav));
|
2018-08-27 08:44:01 +02:00
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.Emit(OpCodes.Dup);
|
|
|
|
Context.EmitStvectmp();
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
Context.EmitLdvectmp();
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Subtract), TypesSubAdd));
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
Context.EmitLdvectmp();
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Subtract), TypesSubAdd));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Average), TypesAvg));
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Add), TypesSubAdd));
|
|
|
|
|
|
|
|
EmitStvecWithSignedCast(Context, Op.Rd, Op.Size);
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpSx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Ldc_I4_1);
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Ldc_I4_1);
|
|
|
|
Context.Emit(OpCodes.Shr);
|
|
|
|
});
|
|
|
|
}
|
2018-08-27 08:44:01 +02:00
|
|
|
}
|
|
|
|
|
Add Fcvtns_S, Fcvtns_V, Fcvtnu_S, Fcvtnu_V (AOpCodeSimd) FP & Umlal_V, Umlsl_V, Saddl_V, Ssubl_V, Usubl_V instructions; add 8 FP & 16 S/Umlal_V, S/Umlsl_V, S/Uaddl_V, S/Usubl_V Tests. (#390)
* Update AOpCodeTable.cs
* Update AInstEmitSimdCvt.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Add QCFlagBit.
* Add QCFlagBit.
2018-09-01 16:52:51 +02:00
|
|
|
public static void Ssubl_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
if (AOptimizations.UseSse41)
|
|
|
|
{
|
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
Type[] TypesSrl = new Type[] { VectorIntTypesPerSizeLog2[Op.Size], typeof(byte) };
|
|
|
|
Type[] TypesCvt = new Type[] { VectorIntTypesPerSizeLog2[Op.Size] };
|
|
|
|
Type[] TypesSub = new Type[] { VectorIntTypesPerSizeLog2[Op.Size + 1],
|
|
|
|
VectorIntTypesPerSizeLog2[Op.Size + 1] };
|
|
|
|
|
|
|
|
string[] NamesCvt = new string[] { nameof(Sse41.ConvertToVector128Int16),
|
|
|
|
nameof(Sse41.ConvertToVector128Int32),
|
|
|
|
nameof(Sse41.ConvertToVector128Int64) };
|
|
|
|
|
|
|
|
int NumBytes = Op.RegisterSize == ARegisterSize.SIMD128 ? 8 : 0;
|
|
|
|
|
|
|
|
EmitLdvecWithSignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NamesCvt[Op.Size], TypesCvt));
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NamesCvt[Op.Size], TypesCvt));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Subtract), TypesSub));
|
|
|
|
|
|
|
|
EmitStvecWithSignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmBinaryOpSx(Context, () => Context.Emit(OpCodes.Sub));
|
|
|
|
}
|
Add Fcvtns_S, Fcvtns_V, Fcvtnu_S, Fcvtnu_V (AOpCodeSimd) FP & Umlal_V, Umlsl_V, Saddl_V, Ssubl_V, Usubl_V instructions; add 8 FP & 16 S/Umlal_V, S/Umlsl_V, S/Uaddl_V, S/Usubl_V Tests. (#390)
* Update AOpCodeTable.cs
* Update AInstEmitSimdCvt.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Add QCFlagBit.
* Add QCFlagBit.
2018-09-01 16:52:51 +02:00
|
|
|
}
|
|
|
|
|
2018-07-19 02:06:28 +02:00
|
|
|
public static void Ssubw_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorWidenRmBinaryOpSx(Context, () => Context.Emit(OpCodes.Sub));
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Sub_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarBinaryOpZx(Context, () => Context.Emit(OpCodes.Sub));
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Sub_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-05-12 01:10:27 +02:00
|
|
|
if (AOptimizations.UseSse2)
|
|
|
|
{
|
Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics (#405)
* Optimize BIC, BSL, BIT, BIF, XTN, ZIP, DUP (Gp), FMADD (Scalar) and FCVT (Scalar) using SSE intrinsics, some CQ improvements
* Remove useless space
* Address PR feedback
* Revert EmitVectorZero32_128 changes
2018-09-27 04:30:21 +02:00
|
|
|
EmitSse2Op(Context, nameof(Sse2.Subtract));
|
2018-05-12 01:10:27 +02:00
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpZx(Context, () => Context.Emit(OpCodes.Sub));
|
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
|
|
|
|
2018-04-20 17:40:15 +02:00
|
|
|
public static void Subhn_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitHighNarrow(Context, () => Context.Emit(OpCodes.Sub), Round: false);
|
|
|
|
}
|
|
|
|
|
2018-08-04 21:58:54 +02:00
|
|
|
public static void Suqadd_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarSaturatingBinaryOpSx(Context, SaturatingFlags.Accumulate);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Suqadd_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorSaturatingBinaryOpSx(Context, SaturatingFlags.Accumulate);
|
|
|
|
}
|
|
|
|
|
2018-06-30 17:40:41 +02:00
|
|
|
public static void Uaba_V(AILEmitterCtx Context)
|
2018-03-30 21:30:23 +02:00
|
|
|
{
|
2018-06-30 17:40:41 +02:00
|
|
|
EmitVectorTernaryOpZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
EmitAbs(Context);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
});
|
2018-03-30 21:30:23 +02:00
|
|
|
}
|
|
|
|
|
2018-06-30 17:40:41 +02:00
|
|
|
public static void Uabal_V(AILEmitterCtx Context)
|
2018-03-30 21:16:16 +02:00
|
|
|
{
|
2018-06-30 17:40:41 +02:00
|
|
|
EmitVectorWidenRnRmTernaryOpZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
EmitAbs(Context);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
});
|
2018-03-30 21:30:23 +02:00
|
|
|
}
|
2018-03-30 21:16:16 +02:00
|
|
|
|
2018-06-30 17:40:41 +02:00
|
|
|
public static void Uabd_V(AILEmitterCtx Context)
|
2018-03-30 21:30:23 +02:00
|
|
|
{
|
2018-06-30 17:40:41 +02:00
|
|
|
EmitVectorBinaryOpZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
EmitAbs(Context);
|
|
|
|
});
|
|
|
|
}
|
2018-03-30 21:16:16 +02:00
|
|
|
|
2018-06-30 17:40:41 +02:00
|
|
|
public static void Uabdl_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmBinaryOpZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
EmitAbs(Context);
|
|
|
|
});
|
2018-03-30 21:16:16 +02:00
|
|
|
}
|
|
|
|
|
2018-08-13 23:10:02 +02:00
|
|
|
public static void Uadalp_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitAddLongPairwise(Context, Signed: false, Accumulate: true);
|
|
|
|
}
|
|
|
|
|
2018-03-30 20:55:28 +02:00
|
|
|
public static void Uaddl_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
if (AOptimizations.UseSse41)
|
|
|
|
{
|
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
Type[] TypesSrl = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size], typeof(byte) };
|
|
|
|
Type[] TypesCvt = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size] };
|
|
|
|
Type[] TypesAdd = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size + 1],
|
|
|
|
VectorUIntTypesPerSizeLog2[Op.Size + 1] };
|
|
|
|
|
|
|
|
string[] NamesCvt = new string[] { nameof(Sse41.ConvertToVector128Int16),
|
|
|
|
nameof(Sse41.ConvertToVector128Int32),
|
|
|
|
nameof(Sse41.ConvertToVector128Int64) };
|
|
|
|
|
|
|
|
int NumBytes = Op.RegisterSize == ARegisterSize.SIMD128 ? 8 : 0;
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NamesCvt[Op.Size], TypesCvt));
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NamesCvt[Op.Size], TypesCvt));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Add), TypesAdd));
|
|
|
|
|
|
|
|
EmitStvecWithUnsignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmBinaryOpZx(Context, () => Context.Emit(OpCodes.Add));
|
|
|
|
}
|
2018-03-30 20:55:28 +02:00
|
|
|
}
|
|
|
|
|
2018-08-13 23:10:02 +02:00
|
|
|
public static void Uaddlp_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitAddLongPairwise(Context, Signed: false, Accumulate: false);
|
|
|
|
}
|
|
|
|
|
2018-02-17 22:06:11 +01:00
|
|
|
public static void Uaddlv_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
2018-07-14 18:13:02 +02:00
|
|
|
int Bytes = Op.GetBitsCount() >> 3;
|
|
|
|
int Elems = Bytes >> Op.Size;
|
2018-02-17 22:06:11 +01:00
|
|
|
|
|
|
|
EmitVectorExtractZx(Context, Op.Rn, 0, Op.Size);
|
|
|
|
|
2018-07-14 18:13:02 +02:00
|
|
|
for (int Index = 1; Index < Elems; Index++)
|
2018-02-17 22:06:11 +01:00
|
|
|
{
|
|
|
|
EmitVectorExtractZx(Context, Op.Rn, Index, Op.Size);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
}
|
|
|
|
|
|
|
|
EmitScalarSet(Context, Op.Rd, Op.Size + 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Uaddw_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-02-20 18:39:03 +01:00
|
|
|
EmitVectorWidenRmBinaryOpZx(Context, () => Context.Emit(OpCodes.Add));
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
2018-03-02 23:21:54 +01:00
|
|
|
|
2018-03-30 17:37:07 +02:00
|
|
|
public static void Uhadd_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (AOptimizations.UseSse2 && Op.Size > 0)
|
2018-03-30 17:37:07 +02:00
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSrl = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size], typeof(byte) };
|
|
|
|
Type[] TypesAndXorAdd = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size], VectorUIntTypesPerSizeLog2[Op.Size] };
|
2018-03-30 17:37:07 +02:00
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Dup);
|
|
|
|
Context.EmitStvectmp();
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Dup);
|
|
|
|
Context.EmitStvectmp2();
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.And), TypesAndXorAdd));
|
|
|
|
|
|
|
|
Context.EmitLdvectmp();
|
|
|
|
Context.EmitLdvectmp2();
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Xor), TypesAndXorAdd));
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(1);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Add), TypesAndXorAdd));
|
|
|
|
|
|
|
|
EmitStvecWithUnsignedCast(Context, Op.Rd, Op.Size);
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Ldc_I4_1);
|
|
|
|
Context.Emit(OpCodes.Shr_Un);
|
|
|
|
});
|
|
|
|
}
|
2018-08-27 08:44:01 +02:00
|
|
|
}
|
2018-03-30 17:37:07 +02:00
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
public static void Uhsub_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (AOptimizations.UseSse2 && Op.Size < 2)
|
2018-08-27 08:44:01 +02:00
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesAvgSub = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size], VectorUIntTypesPerSizeLog2[Op.Size] };
|
2018-08-27 08:44:01 +02:00
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
Context.Emit(OpCodes.Dup);
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Average), TypesAvgSub));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Subtract), TypesAvgSub));
|
|
|
|
|
|
|
|
EmitStvecWithUnsignedCast(Context, Op.Rd, Op.Size);
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Ldc_I4_1);
|
|
|
|
Context.Emit(OpCodes.Shr_Un);
|
|
|
|
});
|
|
|
|
}
|
2018-03-30 17:37:07 +02:00
|
|
|
}
|
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
public static void Umax_V(AILEmitterCtx Context)
|
2018-07-03 08:31:48 +02:00
|
|
|
{
|
|
|
|
Type[] Types = new Type[] { typeof(ulong), typeof(ulong) };
|
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
MethodInfo MthdInfo = typeof(Math).GetMethod(nameof(Math.Max), Types);
|
2018-07-03 08:31:48 +02:00
|
|
|
|
|
|
|
EmitVectorBinaryOpZx(Context, () => Context.EmitCall(MthdInfo));
|
|
|
|
}
|
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
public static void Umaxp_V(AILEmitterCtx Context)
|
2018-07-03 08:31:48 +02:00
|
|
|
{
|
|
|
|
Type[] Types = new Type[] { typeof(ulong), typeof(ulong) };
|
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
MethodInfo MthdInfo = typeof(Math).GetMethod(nameof(Math.Max), Types);
|
2018-07-03 08:31:48 +02:00
|
|
|
|
|
|
|
EmitVectorPairwiseOpZx(Context, () => Context.EmitCall(MthdInfo));
|
|
|
|
}
|
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
public static void Umin_V(AILEmitterCtx Context)
|
2018-07-03 08:31:48 +02:00
|
|
|
{
|
|
|
|
Type[] Types = new Type[] { typeof(ulong), typeof(ulong) };
|
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
MethodInfo MthdInfo = typeof(Math).GetMethod(nameof(Math.Min), Types);
|
2018-07-03 08:31:48 +02:00
|
|
|
|
|
|
|
EmitVectorBinaryOpZx(Context, () => Context.EmitCall(MthdInfo));
|
|
|
|
}
|
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
public static void Uminp_V(AILEmitterCtx Context)
|
2018-07-03 08:31:48 +02:00
|
|
|
{
|
|
|
|
Type[] Types = new Type[] { typeof(ulong), typeof(ulong) };
|
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
MethodInfo MthdInfo = typeof(Math).GetMethod(nameof(Math.Min), Types);
|
2018-07-03 08:31:48 +02:00
|
|
|
|
|
|
|
EmitVectorPairwiseOpZx(Context, () => Context.EmitCall(MthdInfo));
|
|
|
|
}
|
|
|
|
|
Add Fcvtns_S, Fcvtns_V, Fcvtnu_S, Fcvtnu_V (AOpCodeSimd) FP & Umlal_V, Umlsl_V, Saddl_V, Ssubl_V, Usubl_V instructions; add 8 FP & 16 S/Umlal_V, S/Umlsl_V, S/Uaddl_V, S/Usubl_V Tests. (#390)
* Update AOpCodeTable.cs
* Update AInstEmitSimdCvt.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Add QCFlagBit.
* Add QCFlagBit.
2018-09-01 16:52:51 +02:00
|
|
|
public static void Umlal_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (AOptimizations.UseSse41 && Op.Size < 2)
|
Add Fcvtns_S, Fcvtns_V, Fcvtnu_S, Fcvtnu_V (AOpCodeSimd) FP & Umlal_V, Umlsl_V, Saddl_V, Ssubl_V, Usubl_V instructions; add 8 FP & 16 S/Umlal_V, S/Umlsl_V, S/Uaddl_V, S/Usubl_V Tests. (#390)
* Update AOpCodeTable.cs
* Update AInstEmitSimdCvt.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Add QCFlagBit.
* Add QCFlagBit.
2018-09-01 16:52:51 +02:00
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSrl = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size], typeof(byte) };
|
|
|
|
Type[] TypesCvt = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size] };
|
|
|
|
Type[] TypesMulAdd = new Type[] { VectorIntTypesPerSizeLog2 [Op.Size + 1],
|
|
|
|
VectorIntTypesPerSizeLog2 [Op.Size + 1] };
|
|
|
|
|
|
|
|
Type TypeMul = Op.Size == 0 ? typeof(Sse2) : typeof(Sse41);
|
|
|
|
|
|
|
|
string NameCvt = Op.Size == 0
|
|
|
|
? nameof(Sse41.ConvertToVector128Int16)
|
|
|
|
: nameof(Sse41.ConvertToVector128Int32);
|
|
|
|
|
|
|
|
int NumBytes = Op.RegisterSize == ARegisterSize.SIMD128 ? 8 : 0;
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NameCvt, TypesCvt));
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NameCvt, TypesCvt));
|
|
|
|
|
|
|
|
Context.EmitCall(TypeMul.GetMethod(nameof(Sse2.MultiplyLow), TypesMulAdd));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Add), TypesMulAdd));
|
|
|
|
|
|
|
|
EmitStvecWithUnsignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmTernaryOpZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
});
|
|
|
|
}
|
Add Fcvtns_S, Fcvtns_V, Fcvtnu_S, Fcvtnu_V (AOpCodeSimd) FP & Umlal_V, Umlsl_V, Saddl_V, Ssubl_V, Usubl_V instructions; add 8 FP & 16 S/Umlal_V, S/Umlsl_V, S/Uaddl_V, S/Usubl_V Tests. (#390)
* Update AOpCodeTable.cs
* Update AInstEmitSimdCvt.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Add QCFlagBit.
* Add QCFlagBit.
2018-09-01 16:52:51 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Umlsl_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (AOptimizations.UseSse41 && Op.Size < 2)
|
Add Fcvtns_S, Fcvtns_V, Fcvtnu_S, Fcvtnu_V (AOpCodeSimd) FP & Umlal_V, Umlsl_V, Saddl_V, Ssubl_V, Usubl_V instructions; add 8 FP & 16 S/Umlal_V, S/Umlsl_V, S/Uaddl_V, S/Usubl_V Tests. (#390)
* Update AOpCodeTable.cs
* Update AInstEmitSimdCvt.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Add QCFlagBit.
* Add QCFlagBit.
2018-09-01 16:52:51 +02:00
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesSrl = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size], typeof(byte) };
|
|
|
|
Type[] TypesCvt = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size] };
|
|
|
|
Type[] TypesMulSub = new Type[] { VectorIntTypesPerSizeLog2 [Op.Size + 1],
|
|
|
|
VectorIntTypesPerSizeLog2 [Op.Size + 1] };
|
|
|
|
|
|
|
|
Type TypeMul = Op.Size == 0 ? typeof(Sse2) : typeof(Sse41);
|
|
|
|
|
|
|
|
string NameCvt = Op.Size == 0
|
|
|
|
? nameof(Sse41.ConvertToVector128Int16)
|
|
|
|
: nameof(Sse41.ConvertToVector128Int32);
|
|
|
|
|
|
|
|
int NumBytes = Op.RegisterSize == ARegisterSize.SIMD128 ? 8 : 0;
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NameCvt, TypesCvt));
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NameCvt, TypesCvt));
|
|
|
|
|
|
|
|
Context.EmitCall(TypeMul.GetMethod(nameof(Sse2.MultiplyLow), TypesMulSub));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Subtract), TypesMulSub));
|
|
|
|
|
|
|
|
EmitStvecWithUnsignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmTernaryOpZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
Context.Emit(OpCodes.Sub);
|
|
|
|
});
|
|
|
|
}
|
Add Fcvtns_S, Fcvtns_V, Fcvtnu_S, Fcvtnu_V (AOpCodeSimd) FP & Umlal_V, Umlsl_V, Saddl_V, Ssubl_V, Usubl_V instructions; add 8 FP & 16 S/Umlal_V, S/Umlsl_V, S/Uaddl_V, S/Usubl_V Tests. (#390)
* Update AOpCodeTable.cs
* Update AInstEmitSimdCvt.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Add QCFlagBit.
* Add QCFlagBit.
2018-09-01 16:52:51 +02:00
|
|
|
}
|
|
|
|
|
2018-03-02 23:21:54 +01:00
|
|
|
public static void Umull_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmBinaryOpZx(Context, () => Context.Emit(OpCodes.Mul));
|
|
|
|
}
|
2018-04-30 01:39:58 +02:00
|
|
|
|
2018-08-04 21:58:54 +02:00
|
|
|
public static void Uqadd_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarSaturatingBinaryOpZx(Context, SaturatingFlags.Add);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Uqadd_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorSaturatingBinaryOpZx(Context, SaturatingFlags.Add);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Uqsub_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarSaturatingBinaryOpZx(Context, SaturatingFlags.Sub);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Uqsub_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorSaturatingBinaryOpZx(Context, SaturatingFlags.Sub);
|
|
|
|
}
|
|
|
|
|
2018-04-30 01:39:58 +02:00
|
|
|
public static void Uqxtn_S(AILEmitterCtx Context)
|
|
|
|
{
|
2018-09-17 06:54:05 +02:00
|
|
|
EmitSaturatingNarrowOp(Context, SaturatingNarrowFlags.ScalarZxZx);
|
2018-04-30 01:39:58 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
public static void Uqxtn_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-09-17 06:54:05 +02:00
|
|
|
EmitSaturatingNarrowOp(Context, SaturatingNarrowFlags.VectorZxZx);
|
2018-04-30 01:39:58 +02:00
|
|
|
}
|
2018-07-19 02:06:28 +02:00
|
|
|
|
2018-08-27 08:44:01 +02:00
|
|
|
public static void Urhadd_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
if (AOptimizations.UseSse2 && Op.Size < 2)
|
2018-08-27 08:44:01 +02:00
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
Type[] TypesAvg = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size], VectorUIntTypesPerSizeLog2[Op.Size] };
|
2018-08-27 08:44:01 +02:00
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rm, Op.Size);
|
2018-08-27 08:44:01 +02:00
|
|
|
|
2018-10-26 00:10:41 +02:00
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Average), TypesAvg));
|
|
|
|
|
|
|
|
EmitStvecWithUnsignedCast(Context, Op.Rd, Op.Size);
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorBinaryOpZx(Context, () =>
|
|
|
|
{
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Ldc_I4_1);
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Ldc_I4_1);
|
|
|
|
Context.Emit(OpCodes.Shr_Un);
|
|
|
|
});
|
|
|
|
}
|
2018-08-27 08:44:01 +02:00
|
|
|
}
|
|
|
|
|
2018-08-04 21:58:54 +02:00
|
|
|
public static void Usqadd_S(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitScalarSaturatingBinaryOpZx(Context, SaturatingFlags.Accumulate);
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void Usqadd_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorSaturatingBinaryOpZx(Context, SaturatingFlags.Accumulate);
|
|
|
|
}
|
|
|
|
|
Add Fcvtns_S, Fcvtns_V, Fcvtnu_S, Fcvtnu_V (AOpCodeSimd) FP & Umlal_V, Umlsl_V, Saddl_V, Ssubl_V, Usubl_V instructions; add 8 FP & 16 S/Umlal_V, S/Umlsl_V, S/Uaddl_V, S/Usubl_V Tests. (#390)
* Update AOpCodeTable.cs
* Update AInstEmitSimdCvt.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Add QCFlagBit.
* Add QCFlagBit.
2018-09-01 16:52:51 +02:00
|
|
|
public static void Usubl_V(AILEmitterCtx Context)
|
|
|
|
{
|
2018-10-26 00:10:41 +02:00
|
|
|
if (AOptimizations.UseSse41)
|
|
|
|
{
|
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
Type[] TypesSrl = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size], typeof(byte) };
|
|
|
|
Type[] TypesCvt = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size] };
|
|
|
|
Type[] TypesSub = new Type[] { VectorUIntTypesPerSizeLog2[Op.Size + 1],
|
|
|
|
VectorUIntTypesPerSizeLog2[Op.Size + 1] };
|
|
|
|
|
|
|
|
string[] NamesCvt = new string[] { nameof(Sse41.ConvertToVector128Int16),
|
|
|
|
nameof(Sse41.ConvertToVector128Int32),
|
|
|
|
nameof(Sse41.ConvertToVector128Int64) };
|
|
|
|
|
|
|
|
int NumBytes = Op.RegisterSize == ARegisterSize.SIMD128 ? 8 : 0;
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rn, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NamesCvt[Op.Size], TypesCvt));
|
|
|
|
|
|
|
|
EmitLdvecWithUnsignedCast(Context, Op.Rm, Op.Size);
|
|
|
|
|
|
|
|
Context.EmitLdc_I4(NumBytes);
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ShiftRightLogical128BitLane), TypesSrl));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse41).GetMethod(NamesCvt[Op.Size], TypesCvt));
|
|
|
|
|
|
|
|
Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.Subtract), TypesSub));
|
|
|
|
|
|
|
|
EmitStvecWithUnsignedCast(Context, Op.Rd, Op.Size + 1);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
EmitVectorWidenRnRmBinaryOpZx(Context, () => Context.Emit(OpCodes.Sub));
|
|
|
|
}
|
Add Fcvtns_S, Fcvtns_V, Fcvtnu_S, Fcvtnu_V (AOpCodeSimd) FP & Umlal_V, Umlsl_V, Saddl_V, Ssubl_V, Usubl_V instructions; add 8 FP & 16 S/Umlal_V, S/Umlsl_V, S/Uaddl_V, S/Usubl_V Tests. (#390)
* Update AOpCodeTable.cs
* Update AInstEmitSimdCvt.cs
* Update Pseudocode.cs
* Update Instructions.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Update CpuTestSimd.cs
* Update AOpCodeTable.cs
* Update AInstEmitSimdArithmetic.cs
* Update Instructions.cs
* Update CpuTestSimdReg.cs
* Add QCFlagBit.
* Add QCFlagBit.
2018-09-01 16:52:51 +02:00
|
|
|
}
|
|
|
|
|
2018-07-19 02:06:28 +02:00
|
|
|
public static void Usubw_V(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
EmitVectorWidenRmBinaryOpZx(Context, () => Context.Emit(OpCodes.Sub));
|
|
|
|
}
|
2018-09-22 22:26:18 +02:00
|
|
|
|
|
|
|
private static void EmitAbs(AILEmitterCtx Context)
|
|
|
|
{
|
|
|
|
AILLabel LblTrue = new AILLabel();
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Dup);
|
|
|
|
Context.Emit(OpCodes.Ldc_I4_0);
|
|
|
|
Context.Emit(OpCodes.Bge_S, LblTrue);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Neg);
|
|
|
|
|
|
|
|
Context.MarkLabel(LblTrue);
|
|
|
|
}
|
|
|
|
|
|
|
|
private static void EmitAddLongPairwise(AILEmitterCtx Context, bool Signed, bool Accumulate)
|
|
|
|
{
|
|
|
|
AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp;
|
|
|
|
|
|
|
|
int Words = Op.GetBitsCount() >> 4;
|
|
|
|
int Pairs = Words >> Op.Size;
|
|
|
|
|
|
|
|
for (int Index = 0; Index < Pairs; Index++)
|
|
|
|
{
|
|
|
|
int Idx = Index << 1;
|
|
|
|
|
|
|
|
EmitVectorExtract(Context, Op.Rn, Idx, Op.Size, Signed);
|
|
|
|
EmitVectorExtract(Context, Op.Rn, Idx + 1, Op.Size, Signed);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
if (Accumulate)
|
|
|
|
{
|
|
|
|
EmitVectorExtract(Context, Op.Rd, Index, Op.Size + 1, Signed);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
}
|
|
|
|
|
|
|
|
EmitVectorInsertTmp(Context, Index, Op.Size + 1);
|
|
|
|
}
|
|
|
|
|
|
|
|
Context.EmitLdvectmp();
|
|
|
|
Context.EmitStvec(Op.Rd);
|
|
|
|
|
|
|
|
if (Op.RegisterSize == ARegisterSize.SIMD64)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
private static void EmitDoublingMultiplyHighHalf(AILEmitterCtx Context, bool Round)
|
|
|
|
{
|
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
int ESize = 8 << Op.Size;
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Mul);
|
|
|
|
|
|
|
|
if (!Round)
|
|
|
|
{
|
|
|
|
Context.EmitAsr(ESize - 1);
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
long RoundConst = 1L << (ESize - 1);
|
|
|
|
|
|
|
|
AILLabel LblTrue = new AILLabel();
|
|
|
|
|
|
|
|
Context.EmitLsl(1);
|
|
|
|
|
|
|
|
Context.EmitLdc_I8(RoundConst);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
|
|
|
|
Context.EmitAsr(ESize);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Dup);
|
|
|
|
Context.EmitLdc_I8((long)int.MinValue);
|
|
|
|
Context.Emit(OpCodes.Bne_Un_S, LblTrue);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Neg);
|
|
|
|
|
|
|
|
Context.MarkLabel(LblTrue);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
private static void EmitHighNarrow(AILEmitterCtx Context, Action Emit, bool Round)
|
|
|
|
{
|
|
|
|
AOpCodeSimdReg Op = (AOpCodeSimdReg)Context.CurrOp;
|
|
|
|
|
|
|
|
int Elems = 8 >> Op.Size;
|
|
|
|
|
|
|
|
int ESize = 8 << Op.Size;
|
|
|
|
|
|
|
|
int Part = Op.RegisterSize == ARegisterSize.SIMD128 ? Elems : 0;
|
|
|
|
|
|
|
|
long RoundConst = 1L << (ESize - 1);
|
|
|
|
|
|
|
|
if (Part != 0)
|
|
|
|
{
|
|
|
|
Context.EmitLdvec(Op.Rd);
|
|
|
|
Context.EmitStvectmp();
|
|
|
|
}
|
|
|
|
|
|
|
|
for (int Index = 0; Index < Elems; Index++)
|
|
|
|
{
|
|
|
|
EmitVectorExtractZx(Context, Op.Rn, Index, Op.Size + 1);
|
|
|
|
EmitVectorExtractZx(Context, Op.Rm, Index, Op.Size + 1);
|
|
|
|
|
|
|
|
Emit();
|
|
|
|
|
|
|
|
if (Round)
|
|
|
|
{
|
|
|
|
Context.EmitLdc_I8(RoundConst);
|
|
|
|
|
|
|
|
Context.Emit(OpCodes.Add);
|
|
|
|
}
|
|
|
|
|
|
|
|
Context.EmitLsr(ESize);
|
|
|
|
|
|
|
|
EmitVectorInsertTmp(Context, Part + Index, Op.Size);
|
|
|
|
}
|
|
|
|
|
|
|
|
Context.EmitLdvectmp();
|
|
|
|
Context.EmitStvec(Op.Rd);
|
|
|
|
|
|
|
|
if (Part == 0)
|
|
|
|
{
|
|
|
|
EmitVectorZeroUpper(Context, Op.Rd);
|
|
|
|
}
|
|
|
|
}
|
2018-02-17 22:06:11 +01:00
|
|
|
}
|
2018-04-08 21:08:57 +02:00
|
|
|
}
|