From: Craig Topper Date: Tue, 27 Sep 2016 06:44:27 +0000 (+0000) Subject: [X86] Expand all-ones-vector test to cover 256-bit and 512-bit vectors. X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=bdc4313f6aa7cde753e871776699bb3d44c81f47;p=llvm [X86] Expand all-ones-vector test to cover 256-bit and 512-bit vectors. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@282472 91177308-0d34-0410-b5e6-96231b3b80d8 --- diff --git a/test/CodeGen/X86/all-ones-vector.ll b/test/CodeGen/X86/all-ones-vector.ll index 9707eb57ae4..8e050ee2404 100644 --- a/test/CodeGen/X86/all-ones-vector.ll +++ b/test/CodeGen/X86/all-ones-vector.ll @@ -1,8 +1,14 @@ ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py -; RUN: llc < %s -mtriple=i386-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X32 --check-prefix=X32-SSE -; RUN: llc < %s -mtriple=i386-unknown -mattr=+avx | FileCheck %s --check-prefix=X32 --check-prefix=X32-AVX -; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X64 --check-prefix=X64-SSE -; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+avx | FileCheck %s --check-prefix=X64 --check-prefix=X64-AVX +; RUN: llc < %s -mtriple=i386-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X32-SSE +; RUN: llc < %s -mtriple=i386-unknown -mattr=+avx | FileCheck %s --check-prefix=X32-AVX --check-prefix=X32-AVX1 +; RUN: llc < %s -mtriple=i386-unknown -mattr=+avx2 | FileCheck %s --check-prefix=X32-AVX --check-prefix=X32-AVX256 --check-prefix=X32-AVX2 +; RUN: llc < %s -mtriple=i386-unknown -mcpu=knl | FileCheck %s --check-prefix=X32-AVX --check-prefix=X32-AVX256 --check-prefix=X32-AVX512 --check-prefix=X32-KNL +; RUN: llc < %s -mtriple=i386-unknown -mcpu=skx | FileCheck %s --check-prefix=X32-AVX --check-prefix=X32-AVX256 --check-prefix=X32-AVX512 --check-prefix=X32-SKX +; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+sse2 | FileCheck %s --check-prefix=X64-SSE +; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+avx | FileCheck %s --check-prefix=X64-AVX --check-prefix=X64-AVX1 +; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+avx2 | FileCheck %s --check-prefix=X64-AVX --check-prefix=X64-AVX256 --check-prefix=X64-AVX2 +; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=knl | FileCheck %s --check-prefix=X64-AVX --check-prefix=X64-AVX256 --check-prefix=X64-AVX512 --check-prefix=X64-KNL +; RUN: llc < %s -mtriple=x86_64-unknown -mcpu=skx | FileCheck %s --check-prefix=X64-AVX --check-prefix=X64-AVX256 --check-prefix=X64-AVX512 --check-prefix=X64-SKX define <16 x i8> @coo() nounwind { ; X32-SSE-LABEL: coo: @@ -141,3 +147,579 @@ define <4 x float> @foo() nounwind { ; X64-AVX-NEXT: retq ret <4 x float> } + +define <32 x i8> @coo256() nounwind { +; X32-SSE-LABEL: coo256: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: coo256: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: retl +; +; X32-AVX256-LABEL: coo256: +; X32-AVX256: # BB#0: +; X32-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX256-NEXT: retl +; +; X64-SSE-LABEL: coo256: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: coo256: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: retq +; +; X64-AVX256-LABEL: coo256: +; X64-AVX256: # BB#0: +; X64-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX256-NEXT: retq + ret <32 x i8> +} + +define <16 x i16> @soo256() nounwind { +; X32-SSE-LABEL: soo256: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: soo256: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: retl +; +; X32-AVX256-LABEL: soo256: +; X32-AVX256: # BB#0: +; X32-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX256-NEXT: retl +; +; X64-SSE-LABEL: soo256: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: soo256: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: retq +; +; X64-AVX256-LABEL: soo256: +; X64-AVX256: # BB#0: +; X64-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX256-NEXT: retq + ret <16 x i16> +} + +define <8 x i32> @ioo256() nounwind { +; X32-SSE-LABEL: ioo256: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: ioo256: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: retl +; +; X32-AVX256-LABEL: ioo256: +; X32-AVX256: # BB#0: +; X32-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX256-NEXT: retl +; +; X64-SSE-LABEL: ioo256: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: ioo256: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: retq +; +; X64-AVX256-LABEL: ioo256: +; X64-AVX256: # BB#0: +; X64-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX256-NEXT: retq + ret <8 x i32> +} + +define <4 x i64> @loo256() nounwind { +; X32-SSE-LABEL: loo256: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: loo256: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: retl +; +; X32-AVX256-LABEL: loo256: +; X32-AVX256: # BB#0: +; X32-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX256-NEXT: retl +; +; X64-SSE-LABEL: loo256: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: loo256: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: retq +; +; X64-AVX256-LABEL: loo256: +; X64-AVX256: # BB#0: +; X64-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX256-NEXT: retq + ret <4 x i64> +} + +define <4 x double> @doo256() nounwind { +; X32-SSE-LABEL: doo256: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: doo256: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: retl +; +; X32-AVX256-LABEL: doo256: +; X32-AVX256: # BB#0: +; X32-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX256-NEXT: retl +; +; X64-SSE-LABEL: doo256: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: doo256: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: retq +; +; X64-AVX256-LABEL: doo256: +; X64-AVX256: # BB#0: +; X64-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX256-NEXT: retq + ret <4 x double> +} + +define <8 x float> @foo256() nounwind { +; X32-SSE-LABEL: foo256: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: foo256: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: retl +; +; X32-AVX256-LABEL: foo256: +; X32-AVX256: # BB#0: +; X32-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX256-NEXT: retl +; +; X64-SSE-LABEL: foo256: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: foo256: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: retq +; +; X64-AVX256-LABEL: foo256: +; X64-AVX256: # BB#0: +; X64-AVX256-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX256-NEXT: retq + ret <8 x float> +} + +define <64 x i8> @coo512() nounwind { +; X32-SSE-LABEL: coo512: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X32-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: coo512: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X32-AVX1-NEXT: retl +; +; X32-AVX2-LABEL: coo512: +; X32-AVX2: # BB#0: +; X32-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X32-AVX2-NEXT: retl +; +; X32-KNL-LABEL: coo512: +; X32-KNL: # BB#0: +; X32-KNL-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-KNL-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X32-KNL-NEXT: retl +; +; X32-SKX-LABEL: coo512: +; X32-SKX: # BB#0: +; X32-SKX-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X32-SKX-NEXT: retl +; +; X64-SSE-LABEL: coo512: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X64-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: coo512: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X64-AVX1-NEXT: retq +; +; X64-AVX2-LABEL: coo512: +; X64-AVX2: # BB#0: +; X64-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X64-AVX2-NEXT: retq +; +; X64-KNL-LABEL: coo512: +; X64-KNL: # BB#0: +; X64-KNL-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-KNL-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X64-KNL-NEXT: retq +; +; X64-SKX-LABEL: coo512: +; X64-SKX: # BB#0: +; X64-SKX-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X64-SKX-NEXT: retq + ret <64 x i8> +} + +define <32 x i16> @soo512() nounwind { +; X32-SSE-LABEL: soo512: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X32-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: soo512: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X32-AVX1-NEXT: retl +; +; X32-AVX2-LABEL: soo512: +; X32-AVX2: # BB#0: +; X32-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X32-AVX2-NEXT: retl +; +; X32-KNL-LABEL: soo512: +; X32-KNL: # BB#0: +; X32-KNL-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-KNL-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X32-KNL-NEXT: retl +; +; X32-SKX-LABEL: soo512: +; X32-SKX: # BB#0: +; X32-SKX-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X32-SKX-NEXT: retl +; +; X64-SSE-LABEL: soo512: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X64-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: soo512: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X64-AVX1-NEXT: retq +; +; X64-AVX2-LABEL: soo512: +; X64-AVX2: # BB#0: +; X64-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X64-AVX2-NEXT: retq +; +; X64-KNL-LABEL: soo512: +; X64-KNL: # BB#0: +; X64-KNL-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-KNL-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X64-KNL-NEXT: retq +; +; X64-SKX-LABEL: soo512: +; X64-SKX: # BB#0: +; X64-SKX-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X64-SKX-NEXT: retq + ret <32 x i16> +} + +define <16 x i32> @ioo512() nounwind { +; X32-SSE-LABEL: ioo512: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X32-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: ioo512: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X32-AVX1-NEXT: retl +; +; X32-AVX2-LABEL: ioo512: +; X32-AVX2: # BB#0: +; X32-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X32-AVX2-NEXT: retl +; +; X32-AVX512-LABEL: ioo512: +; X32-AVX512: # BB#0: +; X32-AVX512-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X32-AVX512-NEXT: retl +; +; X64-SSE-LABEL: ioo512: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X64-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: ioo512: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X64-AVX1-NEXT: retq +; +; X64-AVX2-LABEL: ioo512: +; X64-AVX2: # BB#0: +; X64-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X64-AVX2-NEXT: retq +; +; X64-AVX512-LABEL: ioo512: +; X64-AVX512: # BB#0: +; X64-AVX512-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X64-AVX512-NEXT: retq + ret <16 x i32> +} + +define <8 x i64> @loo512() nounwind { +; X32-SSE-LABEL: loo512: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X32-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: loo512: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X32-AVX1-NEXT: retl +; +; X32-AVX2-LABEL: loo512: +; X32-AVX2: # BB#0: +; X32-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X32-AVX2-NEXT: retl +; +; X32-AVX512-LABEL: loo512: +; X32-AVX512: # BB#0: +; X32-AVX512-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X32-AVX512-NEXT: retl +; +; X64-SSE-LABEL: loo512: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X64-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: loo512: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X64-AVX1-NEXT: retq +; +; X64-AVX2-LABEL: loo512: +; X64-AVX2: # BB#0: +; X64-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X64-AVX2-NEXT: retq +; +; X64-AVX512-LABEL: loo512: +; X64-AVX512: # BB#0: +; X64-AVX512-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X64-AVX512-NEXT: retq + ret <8 x i64> +} + +define <8 x double> @doo512() nounwind { +; X32-SSE-LABEL: doo512: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X32-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: doo512: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X32-AVX1-NEXT: retl +; +; X32-AVX2-LABEL: doo512: +; X32-AVX2: # BB#0: +; X32-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X32-AVX2-NEXT: retl +; +; X32-AVX512-LABEL: doo512: +; X32-AVX512: # BB#0: +; X32-AVX512-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X32-AVX512-NEXT: retl +; +; X64-SSE-LABEL: doo512: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X64-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: doo512: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X64-AVX1-NEXT: retq +; +; X64-AVX2-LABEL: doo512: +; X64-AVX2: # BB#0: +; X64-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X64-AVX2-NEXT: retq +; +; X64-AVX512-LABEL: doo512: +; X64-AVX512: # BB#0: +; X64-AVX512-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X64-AVX512-NEXT: retq + ret <8 x double> +} + +define <16 x float> @foo512() nounwind { +; X32-SSE-LABEL: foo512: +; X32-SSE: # BB#0: +; X32-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X32-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X32-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X32-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X32-SSE-NEXT: retl +; +; X32-AVX1-LABEL: foo512: +; X32-AVX1: # BB#0: +; X32-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X32-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X32-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X32-AVX1-NEXT: retl +; +; X32-AVX2-LABEL: foo512: +; X32-AVX2: # BB#0: +; X32-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X32-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X32-AVX2-NEXT: retl +; +; X32-AVX512-LABEL: foo512: +; X32-AVX512: # BB#0: +; X32-AVX512-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X32-AVX512-NEXT: retl +; +; X64-SSE-LABEL: foo512: +; X64-SSE: # BB#0: +; X64-SSE-NEXT: pcmpeqd %xmm0, %xmm0 +; X64-SSE-NEXT: pcmpeqd %xmm1, %xmm1 +; X64-SSE-NEXT: pcmpeqd %xmm2, %xmm2 +; X64-SSE-NEXT: pcmpeqd %xmm3, %xmm3 +; X64-SSE-NEXT: retq +; +; X64-AVX1-LABEL: foo512: +; X64-AVX1: # BB#0: +; X64-AVX1-NEXT: vpcmpeqd %xmm0, %xmm0, %xmm0 +; X64-AVX1-NEXT: vinsertf128 $1, %xmm0, %ymm0, %ymm0 +; X64-AVX1-NEXT: vmovaps %ymm0, %ymm1 +; X64-AVX1-NEXT: retq +; +; X64-AVX2-LABEL: foo512: +; X64-AVX2: # BB#0: +; X64-AVX2-NEXT: vpcmpeqd %ymm0, %ymm0, %ymm0 +; X64-AVX2-NEXT: vpcmpeqd %ymm1, %ymm1, %ymm1 +; X64-AVX2-NEXT: retq +; +; X64-AVX512-LABEL: foo512: +; X64-AVX512: # BB#0: +; X64-AVX512-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0 +; X64-AVX512-NEXT: retq + ret <16 x float> +}