From: Simon Pilgrim
Date: Thu, 11 Apr 2019 14:48:46 +0000 (+0000)
Subject: [X86][AVX] Add X86ISD::VPERMV3 demandedelts test
X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=d0586349ae5489f04f70ea1dbab4f1f9d8183c95;p=llvm

[X86][AVX] Add X86ISD::VPERMV3 demandedelts test

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@358175 91177308-0d34-0410-b5e6-96231b3b80d8
---

diff --git a/test/CodeGen/X86/vector-shuffle-combining-avx512bw.ll b/test/CodeGen/X86/vector-shuffle-combining-avx512bw.ll
index b8efb26d6fc..eee3fe26a55 100644
--- a/test/CodeGen/X86/vector-shuffle-combining-avx512bw.ll
+++ b/test/CodeGen/X86/vector-shuffle-combining-avx512bw.ll
@@ -918,6 +918,34 @@ define <8 x double> @combine_vpermi2var_vpermt2var_8f64_as_vperm2(<8 x double> %
   ret <8 x double> %res1
 }
 
+define <8 x double> @combine_vpermi2var_8f64_as_permpd(<8 x double> %x0, <8 x double> %x1, i64 %a2) {
+; X86-LABEL: combine_vpermi2var_8f64_as_permpd:
+; X86: # %bb.0:
+; X86-NEXT: movl $2, %eax
+; X86-NEXT: vmovd %eax, %xmm2
+; X86-NEXT: vmovq {{.*#+}} xmm3 = mem[0],zero
+; X86-NEXT: vpunpcklqdq {{.*#+}} xmm2 = xmm3[0],xmm2[0]
+; X86-NEXT: vinserti128 $1, {{\.LCPI.*}}, %ymm2, %ymm2
+; X86-NEXT: vinserti64x4 $1, {{\.LCPI.*}}, %zmm2, %zmm2
+; X86-NEXT: vpermi2pd %zmm1, %zmm0, %zmm2
+; X86-NEXT: vpermpd {{.*#+}} zmm0 = zmm2[2,3,0,1,6,7,4,5]
+; X86-NEXT: retl
+;
+; X64-LABEL: combine_vpermi2var_8f64_as_permpd:
+; X64: # %bb.0:
+; X64-NEXT: vmovdqa {{.*#+}} xmm2 =
+; X64-NEXT: vpinsrq $0, %rdi, %xmm2, %xmm2
+; X64-NEXT: vmovdqa64 {{.*#+}} zmm3 =
+; X64-NEXT: vinserti32x4 $0, %xmm2, %zmm3, %zmm2
+; X64-NEXT: vpermi2pd %zmm1, %zmm0, %zmm2
+; X64-NEXT: vpermpd {{.*#+}} zmm0 = zmm2[2,3,0,1,6,7,4,5]
+; X64-NEXT: retq
+  %res0 = insertelement <8 x i64> , i64 %a2, i32 0
+  %res1 = call <8 x double> @llvm.x86.avx512.mask.vpermi2var.pd.512(<8 x double> %x0, <8 x i64> %res0, <8 x double> %x1, i8 -1)
+  %res2 = shufflevector <8 x double> %res1, <8 x double> undef, <8 x i32>
+  ret <8 x double> %res2
+}
+
 define <16 x i32> @combine_vpermi2var_vpermt2var_16i32_as_vpermd(<16 x i32> %x0, <16 x i32> %x1) {
 ; CHECK-LABEL: combine_vpermi2var_vpermt2var_16i32_as_vpermd:
 ; CHECK: # %bb.0: