From e9eaa5222e63ca9b11c6eaeb283060b714f2becf Mon Sep 17 00:00:00 2001 From: Dmitry Pentin Date: Tue, 28 Sep 2021 23:29:57 +0300 Subject: [PATCH] FDCT fma usage --- .../Formats/Jpeg/Components/FastFloatingPointDCT.Intrinsic.cs | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/ImageSharp/Formats/Jpeg/Components/FastFloatingPointDCT.Intrinsic.cs b/src/ImageSharp/Formats/Jpeg/Components/FastFloatingPointDCT.Intrinsic.cs index f40ae6e874..ab9462632f 100644 --- a/src/ImageSharp/Formats/Jpeg/Components/FastFloatingPointDCT.Intrinsic.cs +++ b/src/ImageSharp/Formats/Jpeg/Components/FastFloatingPointDCT.Intrinsic.cs @@ -87,8 +87,8 @@ namespace SixLabors.ImageSharp.Formats.Jpeg.Components tmp12 = Avx.Add(tmp6, tmp7); Vector256<float> z5 = Avx.Multiply(Avx.Subtract(tmp10, tmp12), mm256_F_0_3826); - Vector256<float> z2 = Avx.Add(Avx.Multiply(mm256_F_0_5411, tmp10), z5); - Vector256<float> z4 = Avx.Add(Avx.Multiply(mm256_F_1_3065, tmp12), z5); + Vector256<float> z2 = SimdUtils.HwIntrinsics.MultiplyAdd(z5, mm256_F_0_5411, tmp10); + Vector256<float> z4 = SimdUtils.HwIntrinsics.MultiplyAdd(z5, mm256_F_1_3065, tmp12); Vector256<float> z3 = Avx.Multiply(tmp11, mm256_F_0_7071); Vector256<float> z11 = Avx.Add(tmp7, z3);