using ChocolArm64.Decoder; using ChocolArm64.State; using ChocolArm64.Translation; using System; using System.Reflection.Emit; using System.Runtime.Intrinsics; using System.Runtime.Intrinsics.X86; using static ChocolArm64.Instruction.AInstEmitSimdHelper; namespace ChocolArm64.Instruction { static partial class AInstEmit { public static void Fcvt_S(AILEmitterCtx Context) { AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp; if (AOptimizations.UseSse2) { if (Op.Size == 1 && Op.Opc == 0) { //Double -> Single. AVectorHelper.EmitCall(Context, nameof(AVectorHelper.VectorSingleZero)); EmitLdvecWithCastToDouble(Context, Op.Rn); Type[] Types = new Type[] { typeof(Vector128<float>), typeof(Vector128<double>) }; Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ConvertScalarToVector128Single), Types)); Context.EmitStvec(Op.Rd); } else if (Op.Size == 0 && Op.Opc == 1) { //Single -> Double. AVectorHelper.EmitCall(Context, nameof(AVectorHelper.VectorDoubleZero)); Context.EmitLdvec(Op.Rn); Type[] Types = new Type[] { typeof(Vector128<double>), typeof(Vector128<float>) }; Context.EmitCall(typeof(Sse2).GetMethod(nameof(Sse2.ConvertScalarToVector128Double), Types)); EmitStvecWithCastFromDouble(Context, Op.Rd); } else { //Invalid encoding. throw new InvalidOperationException(); } } else { EmitVectorExtractF(Context, Op.Rn, 0, Op.Size); EmitFloatCast(Context, Op.Opc); EmitScalarSetF(Context, Op.Rd, Op.Opc); } } public static void Fcvtas_Gp(AILEmitterCtx Context) { EmitFcvt_s_Gp(Context, () => EmitRoundMathCall(Context, MidpointRounding.AwayFromZero)); } public static void Fcvtau_Gp(AILEmitterCtx Context) { EmitFcvt_u_Gp(Context, () => EmitRoundMathCall(Context, MidpointRounding.AwayFromZero)); } public static void Fcvtl_V(AILEmitterCtx Context) { AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp; int SizeF = Op.Size & 1; int Elems = 4 >> SizeF; int Part = Context.CurrOp.RegisterSize == ARegisterSize.SIMD128 ? Elems : 0; for (int Index = 0; Index < Elems; Index++) { if (SizeF == 0) { EmitVectorExtractZx(Context, Op.Rn, Part + Index, 1); Context.Emit(OpCodes.Conv_U2); Context.EmitCall(typeof(ASoftFloat), nameof(ASoftFloat.ConvertHalfToSingle)); } else /* if (SizeF == 1) */ { EmitVectorExtractF(Context, Op.Rn, Part + Index, 0); Context.Emit(OpCodes.Conv_R8); } EmitVectorInsertF(Context, Op.Rd, Index, SizeF); } } public static void Fcvtms_Gp(AILEmitterCtx Context) { EmitFcvt_s_Gp(Context, () => EmitUnaryMathCall(Context, nameof(Math.Floor))); } public static void Fcvtmu_Gp(AILEmitterCtx Context) { EmitFcvt_u_Gp(Context, () => EmitUnaryMathCall(Context, nameof(Math.Floor))); } public static void Fcvtn_V(AILEmitterCtx Context) { AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp; int SizeF = Op.Size & 1; int Elems = 4 >> SizeF; int Part = Context.CurrOp.RegisterSize == ARegisterSize.SIMD128 ? Elems : 0; for (int Index = 0; Index < Elems; Index++) { EmitVectorExtractF(Context, Op.Rd, Index, SizeF); if (SizeF == 0) { //TODO: This need the half precision floating point type, //that is not yet supported on .NET. We should probably //do our own implementation on the meantime. throw new NotImplementedException(); } else /* if (SizeF == 1) */ { Context.Emit(OpCodes.Conv_R4); EmitVectorInsertF(Context, Op.Rd, Part + Index, 0); } } if (Op.RegisterSize == ARegisterSize.SIMD64) { EmitVectorZeroUpper(Context, Op.Rd); } } public static void Fcvtns_S(AILEmitterCtx Context) { EmitFcvtn(Context, Signed: true, Scalar: true); } public static void Fcvtns_V(AILEmitterCtx Context) { EmitFcvtn(Context, Signed: true, Scalar: false); } public static void Fcvtnu_S(AILEmitterCtx Context) { EmitFcvtn(Context, Signed: false, Scalar: true); } public static void Fcvtnu_V(AILEmitterCtx Context) { EmitFcvtn(Context, Signed: false, Scalar: false); } public static void Fcvtps_Gp(AILEmitterCtx Context) { EmitFcvt_s_Gp(Context, () => EmitUnaryMathCall(Context, nameof(Math.Ceiling))); } public static void Fcvtpu_Gp(AILEmitterCtx Context) { EmitFcvt_u_Gp(Context, () => EmitUnaryMathCall(Context, nameof(Math.Ceiling))); } public static void Fcvtzs_Gp(AILEmitterCtx Context) { EmitFcvt_s_Gp(Context, () => { }); } public static void Fcvtzs_Gp_Fix(AILEmitterCtx Context) { EmitFcvtzs_Gp_Fix(Context); } public static void Fcvtzs_S(AILEmitterCtx Context) { EmitScalarFcvtzs(Context); } public static void Fcvtzs_V(AILEmitterCtx Context) { EmitVectorFcvtzs(Context); } public static void Fcvtzu_Gp(AILEmitterCtx Context) { EmitFcvt_u_Gp(Context, () => { }); } public static void Fcvtzu_Gp_Fix(AILEmitterCtx Context) { EmitFcvtzu_Gp_Fix(Context); } public static void Fcvtzu_S(AILEmitterCtx Context) { EmitScalarFcvtzu(Context); } public static void Fcvtzu_V(AILEmitterCtx Context) { EmitVectorFcvtzu(Context); } public static void Scvtf_Gp(AILEmitterCtx Context) { AOpCodeSimdCvt Op = (AOpCodeSimdCvt)Context.CurrOp; Context.EmitLdintzr(Op.Rn); if (Context.CurrOp.RegisterSize == ARegisterSize.Int32) { Context.Emit(OpCodes.Conv_U4); } EmitFloatCast(Context, Op.Size); EmitScalarSetF(Context, Op.Rd, Op.Size); } public static void Scvtf_S(AILEmitterCtx Context) { AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp; EmitVectorExtractSx(Context, Op.Rn, 0, Op.Size + 2); EmitFloatCast(Context, Op.Size); EmitScalarSetF(Context, Op.Rd, Op.Size); } public static void Scvtf_V(AILEmitterCtx Context) { EmitVectorCvtf(Context, Signed: true); } public static void Ucvtf_Gp(AILEmitterCtx Context) { AOpCodeSimdCvt Op = (AOpCodeSimdCvt)Context.CurrOp; Context.EmitLdintzr(Op.Rn); if (Context.CurrOp.RegisterSize == ARegisterSize.Int32) { Context.Emit(OpCodes.Conv_U4); } Context.Emit(OpCodes.Conv_R_Un); EmitFloatCast(Context, Op.Size); EmitScalarSetF(Context, Op.Rd, Op.Size); } public static void Ucvtf_S(AILEmitterCtx Context) { AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp; EmitVectorExtractZx(Context, Op.Rn, 0, Op.Size + 2); Context.Emit(OpCodes.Conv_R_Un); EmitFloatCast(Context, Op.Size); EmitScalarSetF(Context, Op.Rd, Op.Size); } public static void Ucvtf_V(AILEmitterCtx Context) { EmitVectorCvtf(Context, Signed: false); } private static int GetFBits(AILEmitterCtx Context) { if (Context.CurrOp is AOpCodeSimdShImm Op) { return GetImmShr(Op); } return 0; } private static void EmitFloatCast(AILEmitterCtx Context, int Size) { if (Size == 0) { Context.Emit(OpCodes.Conv_R4); } else if (Size == 1) { Context.Emit(OpCodes.Conv_R8); } else { throw new ArgumentOutOfRangeException(nameof(Size)); } } private static void EmitFcvtn(AILEmitterCtx Context, bool Signed, bool Scalar) { AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp; int SizeF = Op.Size & 1; int SizeI = SizeF + 2; int Bytes = Op.GetBitsCount() >> 3; int Elems = !Scalar ? Bytes >> SizeI : 1; if (Scalar && (SizeF == 0)) { EmitVectorZeroLowerTmp(Context); } for (int Index = 0; Index < Elems; Index++) { EmitVectorExtractF(Context, Op.Rn, Index, SizeF); EmitRoundMathCall(Context, MidpointRounding.ToEven); if (SizeF == 0) { AVectorHelper.EmitCall(Context, Signed ? nameof(AVectorHelper.SatF32ToS32) : nameof(AVectorHelper.SatF32ToU32)); Context.Emit(OpCodes.Conv_U8); } else /* if (SizeF == 1) */ { AVectorHelper.EmitCall(Context, Signed ? nameof(AVectorHelper.SatF64ToS64) : nameof(AVectorHelper.SatF64ToU64)); } EmitVectorInsertTmp(Context, Index, SizeI); } Context.EmitLdvectmp(); Context.EmitStvec(Op.Rd); if ((Op.RegisterSize == ARegisterSize.SIMD64) || Scalar) { EmitVectorZeroUpper(Context, Op.Rd); } } private static void EmitFcvt_s_Gp(AILEmitterCtx Context, Action Emit) { EmitFcvt___Gp(Context, Emit, true); } private static void EmitFcvt_u_Gp(AILEmitterCtx Context, Action Emit) { EmitFcvt___Gp(Context, Emit, false); } private static void EmitFcvt___Gp(AILEmitterCtx Context, Action Emit, bool Signed) { AOpCodeSimdCvt Op = (AOpCodeSimdCvt)Context.CurrOp; EmitVectorExtractF(Context, Op.Rn, 0, Op.Size); Emit(); if (Signed) { EmitScalarFcvts(Context, Op.Size, 0); } else { EmitScalarFcvtu(Context, Op.Size, 0); } if (Context.CurrOp.RegisterSize == ARegisterSize.Int32) { Context.Emit(OpCodes.Conv_U8); } Context.EmitStintzr(Op.Rd); } private static void EmitFcvtzs_Gp_Fix(AILEmitterCtx Context) { EmitFcvtz__Gp_Fix(Context, true); } private static void EmitFcvtzu_Gp_Fix(AILEmitterCtx Context) { EmitFcvtz__Gp_Fix(Context, false); } private static void EmitFcvtz__Gp_Fix(AILEmitterCtx Context, bool Signed) { AOpCodeSimdCvt Op = (AOpCodeSimdCvt)Context.CurrOp; EmitVectorExtractF(Context, Op.Rn, 0, Op.Size); if (Signed) { EmitScalarFcvts(Context, Op.Size, Op.FBits); } else { EmitScalarFcvtu(Context, Op.Size, Op.FBits); } if (Context.CurrOp.RegisterSize == ARegisterSize.Int32) { Context.Emit(OpCodes.Conv_U8); } Context.EmitStintzr(Op.Rd); } private static void EmitVectorScvtf(AILEmitterCtx Context) { EmitVectorCvtf(Context, true); } private static void EmitVectorUcvtf(AILEmitterCtx Context) { EmitVectorCvtf(Context, false); } private static void EmitVectorCvtf(AILEmitterCtx Context, bool Signed) { AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp; int SizeF = Op.Size & 1; int SizeI = SizeF + 2; int FBits = GetFBits(Context); int Bytes = Op.GetBitsCount() >> 3; for (int Index = 0; Index < (Bytes >> SizeI); Index++) { EmitVectorExtract(Context, Op.Rn, Index, SizeI, Signed); if (!Signed) { Context.Emit(OpCodes.Conv_R_Un); } Context.Emit(SizeF == 0 ? OpCodes.Conv_R4 : OpCodes.Conv_R8); EmitI2fFBitsMul(Context, SizeF, FBits); EmitVectorInsertF(Context, Op.Rd, Index, SizeF); } if (Op.RegisterSize == ARegisterSize.SIMD64) { EmitVectorZeroUpper(Context, Op.Rd); } } private static void EmitScalarFcvtzs(AILEmitterCtx Context) { EmitScalarFcvtz(Context, true); } private static void EmitScalarFcvtzu(AILEmitterCtx Context) { EmitScalarFcvtz(Context, false); } private static void EmitScalarFcvtz(AILEmitterCtx Context, bool Signed) { AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp; int SizeF = Op.Size & 1; int SizeI = SizeF + 2; int FBits = GetFBits(Context); EmitVectorExtractF(Context, Op.Rn, 0, SizeF); EmitF2iFBitsMul(Context, SizeF, FBits); if (SizeF == 0) { AVectorHelper.EmitCall(Context, Signed ? nameof(AVectorHelper.SatF32ToS32) : nameof(AVectorHelper.SatF32ToU32)); } else /* if (SizeF == 1) */ { AVectorHelper.EmitCall(Context, Signed ? nameof(AVectorHelper.SatF64ToS64) : nameof(AVectorHelper.SatF64ToU64)); } if (SizeF == 0) { Context.Emit(OpCodes.Conv_U8); } EmitScalarSet(Context, Op.Rd, SizeI); } private static void EmitVectorFcvtzs(AILEmitterCtx Context) { EmitVectorFcvtz(Context, true); } private static void EmitVectorFcvtzu(AILEmitterCtx Context) { EmitVectorFcvtz(Context, false); } private static void EmitVectorFcvtz(AILEmitterCtx Context, bool Signed) { AOpCodeSimd Op = (AOpCodeSimd)Context.CurrOp; int SizeF = Op.Size & 1; int SizeI = SizeF + 2; int FBits = GetFBits(Context); int Bytes = Op.GetBitsCount() >> 3; for (int Index = 0; Index < (Bytes >> SizeI); Index++) { EmitVectorExtractF(Context, Op.Rn, Index, SizeF); EmitF2iFBitsMul(Context, SizeF, FBits); if (SizeF == 0) { AVectorHelper.EmitCall(Context, Signed ? nameof(AVectorHelper.SatF32ToS32) : nameof(AVectorHelper.SatF32ToU32)); } else /* if (SizeF == 1) */ { AVectorHelper.EmitCall(Context, Signed ? nameof(AVectorHelper.SatF64ToS64) : nameof(AVectorHelper.SatF64ToU64)); } if (SizeF == 0) { Context.Emit(OpCodes.Conv_U8); } EmitVectorInsert(Context, Op.Rd, Index, SizeI); } if (Op.RegisterSize == ARegisterSize.SIMD64) { EmitVectorZeroUpper(Context, Op.Rd); } } private static void EmitScalarFcvts(AILEmitterCtx Context, int Size, int FBits) { if (Size < 0 || Size > 1) { throw new ArgumentOutOfRangeException(nameof(Size)); } EmitF2iFBitsMul(Context, Size, FBits); if (Context.CurrOp.RegisterSize == ARegisterSize.Int32) { if (Size == 0) { AVectorHelper.EmitCall(Context, nameof(AVectorHelper.SatF32ToS32)); } else /* if (Size == 1) */ { AVectorHelper.EmitCall(Context, nameof(AVectorHelper.SatF64ToS32)); } } else { if (Size == 0) { AVectorHelper.EmitCall(Context, nameof(AVectorHelper.SatF32ToS64)); } else /* if (Size == 1) */ { AVectorHelper.EmitCall(Context, nameof(AVectorHelper.SatF64ToS64)); } } } private static void EmitScalarFcvtu(AILEmitterCtx Context, int Size, int FBits) { if (Size < 0 || Size > 1) { throw new ArgumentOutOfRangeException(nameof(Size)); } EmitF2iFBitsMul(Context, Size, FBits); if (Context.CurrOp.RegisterSize == ARegisterSize.Int32) { if (Size == 0) { AVectorHelper.EmitCall(Context, nameof(AVectorHelper.SatF32ToU32)); } else /* if (Size == 1) */ { AVectorHelper.EmitCall(Context, nameof(AVectorHelper.SatF64ToU32)); } } else { if (Size == 0) { AVectorHelper.EmitCall(Context, nameof(AVectorHelper.SatF32ToU64)); } else /* if (Size == 1) */ { AVectorHelper.EmitCall(Context, nameof(AVectorHelper.SatF64ToU64)); } } } private static void EmitF2iFBitsMul(AILEmitterCtx Context, int Size, int FBits) { if (FBits != 0) { if (Size == 0) { Context.EmitLdc_R4(MathF.Pow(2, FBits)); } else if (Size == 1) { Context.EmitLdc_R8(Math.Pow(2, FBits)); } else { throw new ArgumentOutOfRangeException(nameof(Size)); } Context.Emit(OpCodes.Mul); } } private static void EmitI2fFBitsMul(AILEmitterCtx Context, int Size, int FBits) { if (FBits != 0) { if (Size == 0) { Context.EmitLdc_R4(1f / MathF.Pow(2, FBits)); } else if (Size == 1) { Context.EmitLdc_R8(1 / Math.Pow(2, FBits)); } else { throw new ArgumentOutOfRangeException(nameof(Size)); } Context.Emit(OpCodes.Mul); } } } }