From 265b1bb37a75e8bb52bfbf3fd9a0e575a75a4a00 Mon Sep 17 00:00:00 2001 From: Cameron McInally Date: Thu, 13 Jun 2019 19:24:24 +0000 Subject: [PATCH] Revert "[NFC][CodeGen] Add unary FNeg tests to X86/avx512-intrinsics-fast-isel.ll" This reverts commit 41e0b9f2803089155536bdec7cbea6b82680a727. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@363301 91177308-0d34-0410-b5e6-96231b3b80d8 --- .../X86/avx512-intrinsics-fast-isel.ll | 657 ------------------ 1 file changed, 657 deletions(-) diff --git a/test/CodeGen/X86/avx512-intrinsics-fast-isel.ll b/test/CodeGen/X86/avx512-intrinsics-fast-isel.ll index 79ac74d72c9..f9c899555dd 100644 --- a/test/CodeGen/X86/avx512-intrinsics-fast-isel.ll +++ b/test/CodeGen/X86/avx512-intrinsics-fast-isel.ll @@ -3099,27 +3099,6 @@ entry: ret <8 x double> %2 } -define <8 x double> @test_mm512_mask_fmsub_round_pd_unary_fneg(<8 x double> %__A, i8 zeroext %__U, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_mask_fmsub_round_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movb {{[0-9]+}}(%esp), %al -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfmsub132pd {rn-sae}, %zmm1, %zmm2, %zmm0 {%k1} -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_mask_fmsub_round_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfmsub132pd {rn-sae}, %zmm1, %zmm2, %zmm0 {%k1} -; X64-NEXT: retq -entry: - %neg = fneg <8 x double> %__C - %0 = tail call <8 x double> @llvm.x86.avx512.vfmadd.pd.512(<8 x double> %__A, <8 x double> %__B, <8 x double> %neg, i32 8) - %1 = bitcast i8 %__U to <8 x i1> - %2 = select <8 x i1> %1, <8 x double> %0, <8 x double> %__A - ret <8 x double> %2 -} - define <8 x double> @test_mm512_maskz_fmsub_round_pd(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; X86-LABEL: test_mm512_maskz_fmsub_round_pd: ; X86: # %bb.0: # %entry @@ -3141,27 +3120,6 @@ entry: ret <8 x double> %2 } -define <8 x double> @test_mm512_maskz_fmsub_round_pd_unary_fneg(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_maskz_fmsub_round_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movb {{[0-9]+}}(%esp), %al -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfmsub213pd {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fmsub_round_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfmsub213pd {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X64-NEXT: retq -entry: - %neg = fneg <8 x double> %__C - %0 = tail call <8 x double> @llvm.x86.avx512.vfmadd.pd.512(<8 x double> %__A, <8 x double> %__B, <8 x double> %neg, i32 8) - %1 = bitcast i8 %__U to <8 x i1> - %2 = select <8 x i1> %1, <8 x double> %0, <8 x double> zeroinitializer - ret <8 x double> %2 -} - define <8 x double> @test_mm512_fnmadd_round_pd(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; X86-LABEL: test_mm512_fnmadd_round_pd: ; X86: # %bb.0: # %entry @@ -3180,24 +3138,6 @@ entry: ret <8 x double> %0 } -define <8 x double> @test_mm512_fnmadd_round_pd_unary_fneg(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_fnmadd_round_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: vpxorq {{\.LCPI.*}}{1to8}, %zmm0, %zmm0 -; X86-NEXT: vfmadd213pd {rn-sae}, %zmm2, %zmm1, %zmm0 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_fnmadd_round_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: vpxorq {{.*}}(%rip){1to8}, %zmm0, %zmm0 -; X64-NEXT: vfmadd213pd {rn-sae}, %zmm2, %zmm1, %zmm0 -; X64-NEXT: retq -entry: - %neg = fneg <8 x double> %__A - %0 = tail call <8 x double> @llvm.x86.avx512.vfmadd.pd.512(<8 x double> %neg, <8 x double> %__B, <8 x double> %__C, i32 8) - ret <8 x double> %0 -} - define <8 x double> @test_mm512_mask3_fnmadd_round_pd(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C, i8 zeroext %__U) { ; X86-LABEL: test_mm512_mask3_fnmadd_round_pd: ; X86: # %bb.0: # %entry @@ -3221,29 +3161,6 @@ entry: ret <8 x double> %2 } -define <8 x double> @test_mm512_mask3_fnmadd_round_pd_unary_fneg(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C, i8 zeroext %__U) { -; X86-LABEL: test_mm512_mask3_fnmadd_round_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movb {{[0-9]+}}(%esp), %al -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmadd231pd {rn-sae}, %zmm1, %zmm0, %zmm2 {%k1} -; X86-NEXT: vmovapd %zmm2, %zmm0 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_mask3_fnmadd_round_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmadd231pd {rn-sae}, %zmm1, %zmm0, %zmm2 {%k1} -; X64-NEXT: vmovapd %zmm2, %zmm0 -; X64-NEXT: retq -entry: - %neg = fneg <8 x double> %__A - %0 = tail call <8 x double> @llvm.x86.avx512.vfmadd.pd.512(<8 x double> %neg, <8 x double> %__B, <8 x double> %__C, i32 8) - %1 = bitcast i8 %__U to <8 x i1> - %2 = select <8 x i1> %1, <8 x double> %0, <8 x double> %__C - ret <8 x double> %2 -} - define <8 x double> @test_mm512_maskz_fnmadd_round_pd(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; X86-LABEL: test_mm512_maskz_fnmadd_round_pd: ; X86: # %bb.0: # %entry @@ -3265,27 +3182,6 @@ entry: ret <8 x double> %2 } -define <8 x double> @test_mm512_maskz_fnmadd_round_pd_unary_fneg(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_maskz_fnmadd_round_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movb {{[0-9]+}}(%esp), %al -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmadd213pd {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fnmadd_round_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmadd213pd {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X64-NEXT: retq -entry: - %neg = fneg <8 x double> %__A - %0 = tail call <8 x double> @llvm.x86.avx512.vfmadd.pd.512(<8 x double> %neg, <8 x double> %__B, <8 x double> %__C, i32 8) - %1 = bitcast i8 %__U to <8 x i1> - %2 = select <8 x i1> %1, <8 x double> %0, <8 x double> zeroinitializer - ret <8 x double> %2 -} - define <8 x double> @test_mm512_fnmsub_round_pd(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; CHECK-LABEL: test_mm512_fnmsub_round_pd: ; CHECK: # %bb.0: # %entry @@ -3301,21 +3197,6 @@ entry: ret <8 x double> %0 } -define <8 x double> @test_mm512_fnmsub_round_pd_unary_fneg(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; CHECK-LABEL: test_mm512_fnmsub_round_pd_unary_fneg: -; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vpbroadcastq {{.*#+}} zmm3 = [-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0] -; CHECK-NEXT: vpxorq %zmm3, %zmm0, %zmm4 -; CHECK-NEXT: vpxorq %zmm3, %zmm2, %zmm0 -; CHECK-NEXT: vfmadd231pd {rn-sae}, %zmm4, %zmm1, %zmm0 -; CHECK-NEXT: ret{{[l|q]}} -entry: - %neg = fneg <8 x double> %__A - %neg1 = fneg <8 x double> %__C - %0 = tail call <8 x double> @llvm.x86.avx512.vfmadd.pd.512(<8 x double> %neg, <8 x double> %__B, <8 x double> %neg1, i32 8) - ret <8 x double> %0 -} - define <8 x double> @test_mm512_maskz_fnmsub_round_pd(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; X86-LABEL: test_mm512_maskz_fnmsub_round_pd: ; X86: # %bb.0: # %entry @@ -3338,28 +3219,6 @@ entry: ret <8 x double> %2 } -define <8 x double> @test_mm512_maskz_fnmsub_round_pd_unary_fneg(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_maskz_fnmsub_round_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movb {{[0-9]+}}(%esp), %al -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmsub213pd {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fnmsub_round_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmsub213pd {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X64-NEXT: retq -entry: - %neg = fneg <8 x double> %__A - %neg1 = fneg <8 x double> %__C - %0 = tail call <8 x double> @llvm.x86.avx512.vfmadd.pd.512(<8 x double> %neg, <8 x double> %__B, <8 x double> %neg1, i32 8) - %1 = bitcast i8 %__U to <8 x i1> - %2 = select <8 x i1> %1, <8 x double> %0, <8 x double> zeroinitializer - ret <8 x double> %2 -} - define <8 x double> @test_mm512_fmadd_pd(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; CHECK-LABEL: test_mm512_fmadd_pd: ; CHECK: # %bb.0: # %entry @@ -3450,24 +3309,6 @@ entry: ret <8 x double> %0 } -define <8 x double> @test_mm512_fmsub_pd_unary_fneg(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_fmsub_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: vpxorq {{\.LCPI.*}}{1to8}, %zmm2, %zmm2 -; X86-NEXT: vfmadd213pd {{.*#+}} zmm0 = (zmm1 * zmm0) + zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_fmsub_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: vpxorq {{.*}}(%rip){1to8}, %zmm2, %zmm2 -; X64-NEXT: vfmadd213pd {{.*#+}} zmm0 = (zmm1 * zmm0) + zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <8 x double> %__C - %0 = tail call <8 x double> @llvm.fma.v8f64(<8 x double> %__A, <8 x double> %__B, <8 x double> %neg.i) #10 - ret <8 x double> %0 -} - define <8 x double> @test_mm512_mask_fmsub_pd(<8 x double> %__A, i8 zeroext %__U, <8 x double> %__B, <8 x double> %__C) { ; X86-LABEL: test_mm512_mask_fmsub_pd: ; X86: # %bb.0: # %entry @@ -3489,27 +3330,6 @@ entry: ret <8 x double> %2 } -define <8 x double> @test_mm512_mask_fmsub_pd_unary_fneg(<8 x double> %__A, i8 zeroext %__U, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_mask_fmsub_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movb {{[0-9]+}}(%esp), %al -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfmsub132pd {{.*#+}} zmm0 = (zmm0 * zmm1) - zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_mask_fmsub_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfmsub132pd {{.*#+}} zmm0 = (zmm0 * zmm1) - zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <8 x double> %__C - %0 = tail call <8 x double> @llvm.fma.v8f64(<8 x double> %__A, <8 x double> %__B, <8 x double> %neg.i) #10 - %1 = bitcast i8 %__U to <8 x i1> - %2 = select <8 x i1> %1, <8 x double> %0, <8 x double> %__A - ret <8 x double> %2 -} - define <8 x double> @test_mm512_maskz_fmsub_pd(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; X86-LABEL: test_mm512_maskz_fmsub_pd: ; X86: # %bb.0: # %entry @@ -3531,27 +3351,6 @@ entry: ret <8 x double> %2 } -define <8 x double> @test_mm512_maskz_fmsub_pd_unary_fneg(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_maskz_fmsub_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movb {{[0-9]+}}(%esp), %al -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfmsub213pd {{.*#+}} zmm0 = (zmm1 * zmm0) - zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fmsub_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfmsub213pd {{.*#+}} zmm0 = (zmm1 * zmm0) - zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <8 x double> %__C - %0 = tail call <8 x double> @llvm.fma.v8f64(<8 x double> %__A, <8 x double> %__B, <8 x double> %neg.i) #10 - %1 = bitcast i8 %__U to <8 x i1> - %2 = select <8 x i1> %1, <8 x double> %0, <8 x double> zeroinitializer - ret <8 x double> %2 -} - define <8 x double> @test_mm512_fnmadd_pd(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; X86-LABEL: test_mm512_fnmadd_pd: ; X86: # %bb.0: # %entry @@ -3570,24 +3369,6 @@ entry: ret <8 x double> %0 } -define <8 x double> @test_mm512_fnmadd_pd_unary_fneg(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_fnmadd_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: vpxorq {{\.LCPI.*}}{1to8}, %zmm0, %zmm0 -; X86-NEXT: vfmadd213pd {{.*#+}} zmm0 = (zmm1 * zmm0) + zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_fnmadd_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: vpxorq {{.*}}(%rip){1to8}, %zmm0, %zmm0 -; X64-NEXT: vfmadd213pd {{.*#+}} zmm0 = (zmm1 * zmm0) + zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <8 x double> %__A - %0 = tail call <8 x double> @llvm.fma.v8f64(<8 x double> %neg.i, <8 x double> %__B, <8 x double> %__C) #10 - ret <8 x double> %0 -} - define <8 x double> @test_mm512_mask3_fnmadd_pd(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C, i8 zeroext %__U) { ; X86-LABEL: test_mm512_mask3_fnmadd_pd: ; X86: # %bb.0: # %entry @@ -3611,29 +3392,6 @@ entry: ret <8 x double> %2 } -define <8 x double> @test_mm512_mask3_fnmadd_pd_unary_fneg(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C, i8 zeroext %__U) { -; X86-LABEL: test_mm512_mask3_fnmadd_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movb {{[0-9]+}}(%esp), %al -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmadd231pd {{.*#+}} zmm2 = -(zmm0 * zmm1) + zmm2 -; X86-NEXT: vmovapd %zmm2, %zmm0 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_mask3_fnmadd_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmadd231pd {{.*#+}} zmm2 = -(zmm0 * zmm1) + zmm2 -; X64-NEXT: vmovapd %zmm2, %zmm0 -; X64-NEXT: retq -entry: - %neg.i = fneg <8 x double> %__A - %0 = tail call <8 x double> @llvm.fma.v8f64(<8 x double> %neg.i, <8 x double> %__B, <8 x double> %__C) #10 - %1 = bitcast i8 %__U to <8 x i1> - %2 = select <8 x i1> %1, <8 x double> %0, <8 x double> %__C - ret <8 x double> %2 -} - define <8 x double> @test_mm512_maskz_fnmadd_pd(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; X86-LABEL: test_mm512_maskz_fnmadd_pd: ; X86: # %bb.0: # %entry @@ -3655,27 +3413,6 @@ entry: ret <8 x double> %2 } -define <8 x double> @test_mm512_maskz_fnmadd_pd_unary_fneg(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_maskz_fnmadd_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movb {{[0-9]+}}(%esp), %al -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmadd213pd {{.*#+}} zmm0 = -(zmm1 * zmm0) + zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fnmadd_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmadd213pd {{.*#+}} zmm0 = -(zmm1 * zmm0) + zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <8 x double> %__A - %0 = tail call <8 x double> @llvm.fma.v8f64(<8 x double> %neg.i, <8 x double> %__B, <8 x double> %__C) #10 - %1 = bitcast i8 %__U to <8 x i1> - %2 = select <8 x i1> %1, <8 x double> %0, <8 x double> zeroinitializer - ret <8 x double> %2 -} - define <8 x double> @test_mm512_fnmsub_pd(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; CHECK-LABEL: test_mm512_fnmsub_pd: ; CHECK: # %bb.0: # %entry @@ -3691,21 +3428,6 @@ entry: ret <8 x double> %0 } -define <8 x double> @test_mm512_fnmsub_pd_unary_fneg(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; CHECK-LABEL: test_mm512_fnmsub_pd_unary_fneg: -; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vpbroadcastq {{.*#+}} zmm3 = [-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0] -; CHECK-NEXT: vpxorq %zmm3, %zmm0, %zmm4 -; CHECK-NEXT: vpxorq %zmm3, %zmm2, %zmm0 -; CHECK-NEXT: vfmadd231pd {{.*#+}} zmm0 = (zmm1 * zmm4) + zmm0 -; CHECK-NEXT: ret{{[l|q]}} -entry: - %neg.i = fneg <8 x double> %__A - %neg1.i = fneg <8 x double> %__C - %0 = tail call <8 x double> @llvm.fma.v8f64(<8 x double> %neg.i, <8 x double> %__B, <8 x double> %neg1.i) #10 - ret <8 x double> %0 -} - define <8 x double> @test_mm512_maskz_fnmsub_pd(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; X86-LABEL: test_mm512_maskz_fnmsub_pd: ; X86: # %bb.0: # %entry @@ -3728,28 +3450,6 @@ entry: ret <8 x double> %2 } -define <8 x double> @test_mm512_maskz_fnmsub_pd_unary_fneg(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_maskz_fnmsub_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movb {{[0-9]+}}(%esp), %al -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmsub213pd {{.*#+}} zmm0 = -(zmm1 * zmm0) - zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fnmsub_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmsub213pd {{.*#+}} zmm0 = -(zmm1 * zmm0) - zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <8 x double> %__A - %neg1.i = fneg <8 x double> %__C - %0 = tail call <8 x double> @llvm.fma.v8f64(<8 x double> %neg.i, <8 x double> %__B, <8 x double> %neg1.i) #10 - %1 = bitcast i8 %__U to <8 x i1> - %2 = select <8 x i1> %1, <8 x double> %0, <8 x double> zeroinitializer - ret <8 x double> %2 -} - define <16 x float> @test_mm512_fmadd_round_ps(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; CHECK-LABEL: test_mm512_fmadd_round_ps: ; CHECK: # %bb.0: # %entry @@ -3842,24 +3542,6 @@ entry: ret <16 x float> %0 } -define <16 x float> @test_mm512_fmsub_round_ps_unary_fneg(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_fmsub_round_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: vpxord {{\.LCPI.*}}{1to16}, %zmm2, %zmm2 -; X86-NEXT: vfmadd213ps {rn-sae}, %zmm2, %zmm1, %zmm0 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_fmsub_round_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: vpxord {{.*}}(%rip){1to16}, %zmm2, %zmm2 -; X64-NEXT: vfmadd213ps {rn-sae}, %zmm2, %zmm1, %zmm0 -; X64-NEXT: retq -entry: - %neg = fneg <16 x float> %__C - %0 = tail call <16 x float> @llvm.x86.avx512.vfmadd.ps.512(<16 x float> %__A, <16 x float> %__B, <16 x float> %neg, i32 8) - ret <16 x float> %0 -} - define <16 x float> @test_mm512_mask_fmsub_round_ps(<16 x float> %__A, i16 zeroext %__U, <16 x float> %__B, <16 x float> %__C) { ; X86-LABEL: test_mm512_mask_fmsub_round_ps: ; X86: # %bb.0: # %entry @@ -3881,27 +3563,6 @@ entry: ret <16 x float> %2 } -define <16 x float> @test_mm512_mask_fmsub_round_ps_unary_fneg(<16 x float> %__A, i16 zeroext %__U, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_mask_fmsub_round_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfmsub132ps {rn-sae}, %zmm1, %zmm2, %zmm0 {%k1} -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_mask_fmsub_round_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfmsub132ps {rn-sae}, %zmm1, %zmm2, %zmm0 {%k1} -; X64-NEXT: retq -entry: - %neg = fneg <16 x float> %__C - %0 = tail call <16 x float> @llvm.x86.avx512.vfmadd.ps.512(<16 x float> %__A, <16 x float> %__B, <16 x float> %neg, i32 8) - %1 = bitcast i16 %__U to <16 x i1> - %2 = select <16 x i1> %1, <16 x float> %0, <16 x float> %__A - ret <16 x float> %2 -} - define <16 x float> @test_mm512_maskz_fmsub_round_ps(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; X86-LABEL: test_mm512_maskz_fmsub_round_ps: ; X86: # %bb.0: # %entry @@ -3923,27 +3584,6 @@ entry: ret <16 x float> %2 } -define <16 x float> @test_mm512_maskz_fmsub_round_ps_unary_fneg(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_maskz_fmsub_round_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfmsub213ps {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fmsub_round_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfmsub213ps {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X64-NEXT: retq -entry: - %neg = fneg <16 x float> %__C - %0 = tail call <16 x float> @llvm.x86.avx512.vfmadd.ps.512(<16 x float> %__A, <16 x float> %__B, <16 x float> %neg, i32 8) - %1 = bitcast i16 %__U to <16 x i1> - %2 = select <16 x i1> %1, <16 x float> %0, <16 x float> zeroinitializer - ret <16 x float> %2 -} - define <16 x float> @test_mm512_fnmadd_round_ps(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; X86-LABEL: test_mm512_fnmadd_round_ps: ; X86: # %bb.0: # %entry @@ -3962,24 +3602,6 @@ entry: ret <16 x float> %0 } -define <16 x float> @test_mm512_fnmadd_round_ps_unary_fneg(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_fnmadd_round_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: vpxord {{\.LCPI.*}}{1to16}, %zmm0, %zmm0 -; X86-NEXT: vfmadd213ps {rn-sae}, %zmm2, %zmm1, %zmm0 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_fnmadd_round_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: vpxord {{.*}}(%rip){1to16}, %zmm0, %zmm0 -; X64-NEXT: vfmadd213ps {rn-sae}, %zmm2, %zmm1, %zmm0 -; X64-NEXT: retq -entry: - %neg = fneg <16 x float> %__A - %0 = tail call <16 x float> @llvm.x86.avx512.vfmadd.ps.512(<16 x float> %neg, <16 x float> %__B, <16 x float> %__C, i32 8) - ret <16 x float> %0 -} - define <16 x float> @test_mm512_mask3_fnmadd_round_ps(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C, i16 zeroext %__U) { ; X86-LABEL: test_mm512_mask3_fnmadd_round_ps: ; X86: # %bb.0: # %entry @@ -4003,29 +3625,6 @@ entry: ret <16 x float> %2 } -define <16 x float> @test_mm512_mask3_fnmadd_round_ps_unary_fneg(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C, i16 zeroext %__U) { -; X86-LABEL: test_mm512_mask3_fnmadd_round_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmadd231ps {rn-sae}, %zmm1, %zmm0, %zmm2 {%k1} -; X86-NEXT: vmovaps %zmm2, %zmm0 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_mask3_fnmadd_round_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmadd231ps {rn-sae}, %zmm1, %zmm0, %zmm2 {%k1} -; X64-NEXT: vmovaps %zmm2, %zmm0 -; X64-NEXT: retq -entry: - %neg = fneg <16 x float> %__A - %0 = tail call <16 x float> @llvm.x86.avx512.vfmadd.ps.512(<16 x float> %neg, <16 x float> %__B, <16 x float> %__C, i32 8) - %1 = bitcast i16 %__U to <16 x i1> - %2 = select <16 x i1> %1, <16 x float> %0, <16 x float> %__C - ret <16 x float> %2 -} - define <16 x float> @test_mm512_maskz_fnmadd_round_ps(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; X86-LABEL: test_mm512_maskz_fnmadd_round_ps: ; X86: # %bb.0: # %entry @@ -4047,27 +3646,6 @@ entry: ret <16 x float> %2 } -define <16 x float> @test_mm512_maskz_fnmadd_round_ps_unary_fneg(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_maskz_fnmadd_round_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmadd213ps {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fnmadd_round_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmadd213ps {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X64-NEXT: retq -entry: - %neg = fneg <16 x float> %__A - %0 = tail call <16 x float> @llvm.x86.avx512.vfmadd.ps.512(<16 x float> %neg, <16 x float> %__B, <16 x float> %__C, i32 8) - %1 = bitcast i16 %__U to <16 x i1> - %2 = select <16 x i1> %1, <16 x float> %0, <16 x float> zeroinitializer - ret <16 x float> %2 -} - define <16 x float> @test_mm512_fnmsub_round_ps(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; CHECK-LABEL: test_mm512_fnmsub_round_ps: ; CHECK: # %bb.0: # %entry @@ -4083,21 +3661,6 @@ entry: ret <16 x float> %0 } -define <16 x float> @test_mm512_fnmsub_round_ps_unary_fneg(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; CHECK-LABEL: test_mm512_fnmsub_round_ps_unary_fneg: -; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vpbroadcastd {{.*#+}} zmm3 = [-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0] -; CHECK-NEXT: vpxord %zmm3, %zmm0, %zmm4 -; CHECK-NEXT: vpxord %zmm3, %zmm2, %zmm0 -; CHECK-NEXT: vfmadd231ps {rn-sae}, %zmm4, %zmm1, %zmm0 -; CHECK-NEXT: ret{{[l|q]}} -entry: - %neg = fneg <16 x float> %__A - %neg1 = fneg <16 x float> %__C - %0 = tail call <16 x float> @llvm.x86.avx512.vfmadd.ps.512(<16 x float> %neg, <16 x float> %__B, <16 x float> %neg1, i32 8) - ret <16 x float> %0 -} - define <16 x float> @test_mm512_maskz_fnmsub_round_ps(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; X86-LABEL: test_mm512_maskz_fnmsub_round_ps: ; X86: # %bb.0: # %entry @@ -4120,28 +3683,6 @@ entry: ret <16 x float> %2 } -define <16 x float> @test_mm512_maskz_fnmsub_round_ps_unary_fneg(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_maskz_fnmsub_round_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmsub213ps {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fnmsub_round_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmsub213ps {rn-sae}, %zmm2, %zmm1, %zmm0 {%k1} {z} -; X64-NEXT: retq -entry: - %neg = fneg <16 x float> %__A - %neg1 = fneg <16 x float> %__C - %0 = tail call <16 x float> @llvm.x86.avx512.vfmadd.ps.512(<16 x float> %neg, <16 x float> %__B, <16 x float> %neg1, i32 8) - %1 = bitcast i16 %__U to <16 x i1> - %2 = select <16 x i1> %1, <16 x float> %0, <16 x float> zeroinitializer - ret <16 x float> %2 -} - define <16 x float> @test_mm512_fmadd_ps(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; CHECK-LABEL: test_mm512_fmadd_ps: ; CHECK: # %bb.0: # %entry @@ -4232,24 +3773,6 @@ entry: ret <16 x float> %0 } -define <16 x float> @test_mm512_fmsub_ps_unary_fneg(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_fmsub_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: vpxord {{\.LCPI.*}}{1to16}, %zmm2, %zmm2 -; X86-NEXT: vfmadd213ps {{.*#+}} zmm0 = (zmm1 * zmm0) + zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_fmsub_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: vpxord {{.*}}(%rip){1to16}, %zmm2, %zmm2 -; X64-NEXT: vfmadd213ps {{.*#+}} zmm0 = (zmm1 * zmm0) + zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <16 x float> %__C - %0 = tail call <16 x float> @llvm.fma.v16f32(<16 x float> %__A, <16 x float> %__B, <16 x float> %neg.i) #10 - ret <16 x float> %0 -} - define <16 x float> @test_mm512_mask_fmsub_ps(<16 x float> %__A, i16 zeroext %__U, <16 x float> %__B, <16 x float> %__C) { ; X86-LABEL: test_mm512_mask_fmsub_ps: ; X86: # %bb.0: # %entry @@ -4271,27 +3794,6 @@ entry: ret <16 x float> %2 } -define <16 x float> @test_mm512_mask_fmsub_ps_unary_fneg(<16 x float> %__A, i16 zeroext %__U, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_mask_fmsub_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfmsub132ps {{.*#+}} zmm0 = (zmm0 * zmm1) - zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_mask_fmsub_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfmsub132ps {{.*#+}} zmm0 = (zmm0 * zmm1) - zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <16 x float> %__C - %0 = tail call <16 x float> @llvm.fma.v16f32(<16 x float> %__A, <16 x float> %__B, <16 x float> %neg.i) #10 - %1 = bitcast i16 %__U to <16 x i1> - %2 = select <16 x i1> %1, <16 x float> %0, <16 x float> %__A - ret <16 x float> %2 -} - define <16 x float> @test_mm512_maskz_fmsub_ps(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; X86-LABEL: test_mm512_maskz_fmsub_ps: ; X86: # %bb.0: # %entry @@ -4313,27 +3815,6 @@ entry: ret <16 x float> %2 } -define <16 x float> @test_mm512_maskz_fmsub_ps_unary_fneg(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_maskz_fmsub_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfmsub213ps {{.*#+}} zmm0 = (zmm1 * zmm0) - zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fmsub_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfmsub213ps {{.*#+}} zmm0 = (zmm1 * zmm0) - zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <16 x float> %__C - %0 = tail call <16 x float> @llvm.fma.v16f32(<16 x float> %__A, <16 x float> %__B, <16 x float> %neg.i) #10 - %1 = bitcast i16 %__U to <16 x i1> - %2 = select <16 x i1> %1, <16 x float> %0, <16 x float> zeroinitializer - ret <16 x float> %2 -} - define <16 x float> @test_mm512_fnmadd_ps(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; X86-LABEL: test_mm512_fnmadd_ps: ; X86: # %bb.0: # %entry @@ -4352,24 +3833,6 @@ entry: ret <16 x float> %0 } -define <16 x float> @test_mm512_fnmadd_ps_unary_fneg(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_fnmadd_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: vpxord {{\.LCPI.*}}{1to16}, %zmm0, %zmm0 -; X86-NEXT: vfmadd213ps {{.*#+}} zmm0 = (zmm1 * zmm0) + zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_fnmadd_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: vpxord {{.*}}(%rip){1to16}, %zmm0, %zmm0 -; X64-NEXT: vfmadd213ps {{.*#+}} zmm0 = (zmm1 * zmm0) + zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <16 x float> %__A - %0 = tail call <16 x float> @llvm.fma.v16f32(<16 x float> %neg.i, <16 x float> %__B, <16 x float> %__C) #10 - ret <16 x float> %0 -} - define <16 x float> @test_mm512_mask3_fnmadd_ps(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C, i16 zeroext %__U) { ; X86-LABEL: test_mm512_mask3_fnmadd_ps: ; X86: # %bb.0: # %entry @@ -4393,29 +3856,6 @@ entry: ret <16 x float> %2 } -define <16 x float> @test_mm512_mask3_fnmadd_ps_unary_fneg(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C, i16 zeroext %__U) { -; X86-LABEL: test_mm512_mask3_fnmadd_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmadd231ps {{.*#+}} zmm2 = -(zmm0 * zmm1) + zmm2 -; X86-NEXT: vmovaps %zmm2, %zmm0 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_mask3_fnmadd_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmadd231ps {{.*#+}} zmm2 = -(zmm0 * zmm1) + zmm2 -; X64-NEXT: vmovaps %zmm2, %zmm0 -; X64-NEXT: retq -entry: - %neg.i = fneg <16 x float> %__A - %0 = tail call <16 x float> @llvm.fma.v16f32(<16 x float> %neg.i, <16 x float> %__B, <16 x float> %__C) #10 - %1 = bitcast i16 %__U to <16 x i1> - %2 = select <16 x i1> %1, <16 x float> %0, <16 x float> %__C - ret <16 x float> %2 -} - define <16 x float> @test_mm512_maskz_fnmadd_ps(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; X86-LABEL: test_mm512_maskz_fnmadd_ps: ; X86: # %bb.0: # %entry @@ -4437,27 +3877,6 @@ entry: ret <16 x float> %2 } -define <16 x float> @test_mm512_maskz_fnmadd_ps_unary_fneg(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_maskz_fnmadd_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmadd213ps {{.*#+}} zmm0 = -(zmm1 * zmm0) + zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fnmadd_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmadd213ps {{.*#+}} zmm0 = -(zmm1 * zmm0) + zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <16 x float> %__A - %0 = tail call <16 x float> @llvm.fma.v16f32(<16 x float> %neg.i, <16 x float> %__B, <16 x float> %__C) #10 - %1 = bitcast i16 %__U to <16 x i1> - %2 = select <16 x i1> %1, <16 x float> %0, <16 x float> zeroinitializer - ret <16 x float> %2 -} - define <16 x float> @test_mm512_fnmsub_ps(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; CHECK-LABEL: test_mm512_fnmsub_ps: ; CHECK: # %bb.0: # %entry @@ -4473,21 +3892,6 @@ entry: ret <16 x float> %0 } -define <16 x float> @test_mm512_fnmsub_ps_unary_fneg(<16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; CHECK-LABEL: test_mm512_fnmsub_ps_unary_fneg: -; CHECK: # %bb.0: # %entry -; CHECK-NEXT: vpbroadcastd {{.*#+}} zmm3 = [-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0,-0.0E+0] -; CHECK-NEXT: vpxord %zmm3, %zmm0, %zmm4 -; CHECK-NEXT: vpxord %zmm3, %zmm2, %zmm0 -; CHECK-NEXT: vfmadd231ps {{.*#+}} zmm0 = (zmm1 * zmm4) + zmm0 -; CHECK-NEXT: ret{{[l|q]}} -entry: - %neg.i = fneg <16 x float> %__A - %neg1.i = fneg <16 x float> %__C - %0 = tail call <16 x float> @llvm.fma.v16f32(<16 x float> %neg.i, <16 x float> %__B, <16 x float> %neg1.i) #10 - ret <16 x float> %0 -} - define <16 x float> @test_mm512_maskz_fnmsub_ps(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { ; X86-LABEL: test_mm512_maskz_fnmsub_ps: ; X86: # %bb.0: # %entry @@ -4510,28 +3914,6 @@ entry: ret <16 x float> %2 } -define <16 x float> @test_mm512_maskz_fnmsub_ps_unary_fneg(i16 zeroext %__U, <16 x float> %__A, <16 x float> %__B, <16 x float> %__C) { -; X86-LABEL: test_mm512_maskz_fnmsub_ps_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movzwl {{[0-9]+}}(%esp), %eax -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfnmsub213ps {{.*#+}} zmm0 = -(zmm1 * zmm0) - zmm2 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_maskz_fnmsub_ps_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfnmsub213ps {{.*#+}} zmm0 = -(zmm1 * zmm0) - zmm2 -; X64-NEXT: retq -entry: - %neg.i = fneg <16 x float> %__A - %neg1.i = fneg <16 x float> %__C - %0 = tail call <16 x float> @llvm.fma.v16f32(<16 x float> %neg.i, <16 x float> %__B, <16 x float> %neg1.i) #10 - %1 = bitcast i16 %__U to <16 x i1> - %2 = select <16 x i1> %1, <16 x float> %0, <16 x float> zeroinitializer - ret <16 x float> %2 -} - define <8 x double> @test_mm512_fmaddsub_round_pd(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; CHECK-LABEL: test_mm512_fmaddsub_round_pd: ; CHECK: # %bb.0: # %entry @@ -4624,24 +4006,6 @@ entry: ret <8 x double> %0 } -define <8 x double> @test_mm512_fmsubadd_round_pd_unary_fneg(<8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_fmsubadd_round_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: vpxorq {{\.LCPI.*}}{1to8}, %zmm2, %zmm2 -; X86-NEXT: vfmaddsub213pd {rn-sae}, %zmm2, %zmm1, %zmm0 -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_fmsubadd_round_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: vpxorq {{.*}}(%rip){1to8}, %zmm2, %zmm2 -; X64-NEXT: vfmaddsub213pd {rn-sae}, %zmm2, %zmm1, %zmm0 -; X64-NEXT: retq -entry: - %neg = fneg <8 x double> %__C - %0 = tail call <8 x double> @llvm.x86.avx512.vfmaddsub.pd.512(<8 x double> %__A, <8 x double> %__B, <8 x double> %neg, i32 8) - ret <8 x double> %0 -} - define <8 x double> @test_mm512_mask_fmsubadd_round_pd(<8 x double> %__A, i8 zeroext %__U, <8 x double> %__B, <8 x double> %__C) { ; X86-LABEL: test_mm512_mask_fmsubadd_round_pd: ; X86: # %bb.0: # %entry @@ -4663,27 +4027,6 @@ entry: ret <8 x double> %2 } -define <8 x double> @test_mm512_mask_fmsubadd_round_pd_unary_fneg(<8 x double> %__A, i8 zeroext %__U, <8 x double> %__B, <8 x double> %__C) { -; X86-LABEL: test_mm512_mask_fmsubadd_round_pd_unary_fneg: -; X86: # %bb.0: # %entry -; X86-NEXT: movb {{[0-9]+}}(%esp), %al -; X86-NEXT: kmovw %eax, %k1 -; X86-NEXT: vfmsubadd132pd {rn-sae}, %zmm1, %zmm2, %zmm0 {%k1} -; X86-NEXT: retl -; -; X64-LABEL: test_mm512_mask_fmsubadd_round_pd_unary_fneg: -; X64: # %bb.0: # %entry -; X64-NEXT: kmovw %edi, %k1 -; X64-NEXT: vfmsubadd132pd {rn-sae}, %zmm1, %zmm2, %zmm0 {%k1} -; X64-NEXT: retq -entry: - %neg = fneg <8 x double> %__C - %0 = tail call <8 x double> @llvm.x86.avx512.vfmaddsub.pd.512(<8 x double> %__A, <8 x double> %__B, <8 x double> %neg, i32 8) - %1 = bitcast i8 %__U to <8 x i1> - %2 = select <8 x i1> %1, <8 x double> %0, <8 x double> %__A - ret <8 x double> %2 -} - define <8 x double> @test_mm512_maskz_fmsubadd_round_pd(i8 zeroext %__U, <8 x double> %__A, <8 x double> %__B, <8 x double> %__C) { ; X86-LABEL: test_mm512_maskz_fmsubadd_round_pd: ; X86: # %bb.0: # %entry -- 2.40.0