From: Simon Pilgrim Date: Sun, 10 Dec 2017 13:41:29 +0000 (+0000) Subject: Regenerate some AVX2+ scheduling tests that got missed X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=1c5c6081ed0ba9c17445bb44d800b1d36ae07b6a;p=llvm Regenerate some AVX2+ scheduling tests that got missed git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@320307 91177308-0d34-0410-b5e6-96231b3b80d8 --- diff --git a/test/CodeGen/X86/avx2-schedule.ll b/test/CodeGen/X86/avx2-schedule.ll index cb73421c8ba..d8dc3bb84f5 100644 --- a/test/CodeGen/X86/avx2-schedule.ll +++ b/test/CodeGen/X86/avx2-schedule.ll @@ -178,7 +178,7 @@ define <4 x i32> @test_extracti128(<8 x i32> %a0, <8 x i32> %a1, <4 x i32> *%a2) ; GENERIC-NEXT: vpsubd %ymm1, %ymm0, %ymm0 # sched: [3:1.00] ; GENERIC-NEXT: vextracti128 $1, %ymm0, %xmm0 # sched: [1:1.00] ; GENERIC-NEXT: vextracti128 $1, %ymm2, (%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_extracti128: @@ -482,7 +482,7 @@ define <4 x float> @test_gatherqps_ymm(<4 x float> %a0, i8* %a1, <4 x i64> %a2, ; GENERIC-LABEL: test_gatherqps_ymm: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vgatherqps %xmm2, (%rdi,%ymm1,4), %xmm0 # sched: [4:0.50] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_gatherqps_ymm: @@ -2926,7 +2926,7 @@ define <4 x i32> @test_pgatherqd_ymm(<4 x i32> %a0, i8* %a1, <4 x i64> %a2, <4 x ; GENERIC-LABEL: test_pgatherqd_ymm: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vpgatherqd %xmm2, (%rdi,%ymm1,2), %xmm0 # sched: [4:0.50] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_pgatherqd_ymm: @@ -4095,7 +4095,7 @@ define i32 @test_pmovmskb(<32 x i8> %a0) { ; GENERIC-LABEL: test_pmovmskb: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vpmovmskb %ymm0, %eax # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; HASWELL-LABEL: test_pmovmskb: diff --git a/test/CodeGen/X86/avx512-schedule.ll b/test/CodeGen/X86/avx512-schedule.ll index 7d99f7d3986..3573c4db726 100755 --- a/test/CodeGen/X86/avx512-schedule.ll +++ b/test/CodeGen/X86/avx512-schedule.ll @@ -1489,7 +1489,7 @@ define <4 x float> @slto4f32(<4 x i64> %a) { ; GENERIC-LABEL: slto4f32: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vcvtqq2ps %ymm0, %xmm0 # sched: [4:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: slto4f32: @@ -1505,7 +1505,7 @@ define <4 x float> @ulto4f32(<4 x i64> %a) { ; GENERIC-LABEL: ulto4f32: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vcvtuqq2ps %ymm0, %xmm0 # sched: [4:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: ulto4f32: @@ -1580,7 +1580,7 @@ define <16 x i8> @f32to16uc(<16 x float> %f) { ; GENERIC: # %bb.0: ; GENERIC-NEXT: vcvttps2dq %zmm0, %zmm0 # sched: [3:1.00] ; GENERIC-NEXT: vpmovdb %zmm0, %xmm0 # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: f32to16uc: @@ -1656,7 +1656,7 @@ define <8 x i16> @f64to8us(<8 x double> %f) { ; GENERIC: # %bb.0: ; GENERIC-NEXT: vcvttpd2dq %zmm0, %ymm0 # sched: [3:1.00] ; GENERIC-NEXT: vpmovdw %ymm0, %xmm0 # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: f64to8us: @@ -1674,7 +1674,7 @@ define <8 x i8> @f64to8uc(<8 x double> %f) { ; GENERIC: # %bb.0: ; GENERIC-NEXT: vcvttpd2dq %zmm0, %ymm0 # sched: [3:1.00] ; GENERIC-NEXT: vpmovdw %ymm0, %xmm0 # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: f64to8uc: @@ -1691,7 +1691,7 @@ define <4 x i32> @f64to4ui(<4 x double> %a) nounwind { ; GENERIC-LABEL: f64to4ui: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vcvttpd2udq %ymm0, %xmm0 # sched: [3:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: f64to4ui: @@ -1779,7 +1779,7 @@ define <4 x i32> @f64to4si(<4 x double> %a) { ; GENERIC-LABEL: f64to4si: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vcvttpd2dq %ymm0, %xmm0 # sched: [4:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: f64to4si: @@ -1813,7 +1813,7 @@ define <4 x float> @f64to4f32(<4 x double> %b) { ; GENERIC-LABEL: f64to4f32: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vcvtpd2ps %ymm0, %xmm0 # sched: [4:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: f64to4f32: @@ -1831,7 +1831,7 @@ define <4 x float> @f64to4f32_mask(<4 x double> %b, <4 x i1> %mask) { ; GENERIC-NEXT: vpslld $31, %xmm1, %xmm1 # sched: [1:1.00] ; GENERIC-NEXT: vptestmd %xmm1, %xmm1, %k1 # sched: [1:1.00] ; GENERIC-NEXT: vcvtpd2ps %ymm0, %xmm0 {%k1} {z} # sched: [3:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: f64to4f32_mask: @@ -4357,7 +4357,7 @@ define i16 @trunc_16i32_to_16i1(<16 x i32> %a) { ; GENERIC-NEXT: vptestmd %zmm0, %zmm0, %k0 # sched: [1:1.00] ; GENERIC-NEXT: kmovd %k0, %eax # sched: [1:0.33] ; GENERIC-NEXT: # kill: def %ax killed %ax killed %eax -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: trunc_16i32_to_16i1: @@ -4476,7 +4476,7 @@ define <8 x i16> @sext_8i1_8i16(<8 x i32> %a1, <8 x i32> %a2) nounwind { ; GENERIC: # %bb.0: ; GENERIC-NEXT: vpcmpgtd %ymm0, %ymm1, %k0 # sched: [3:1.00] ; GENERIC-NEXT: vpmovm2w %k0, %xmm0 # sched: [1:0.33] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: sext_8i1_8i16: @@ -4529,7 +4529,7 @@ define void @extload_v8i64(<8 x i8>* %a, <8 x i64>* %res) { ; GENERIC: # %bb.0: ; GENERIC-NEXT: vpmovsxbq (%rdi), %zmm0 # sched: [5:1.00] ; GENERIC-NEXT: vmovdqa64 %zmm0, (%rsi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: extload_v8i64: @@ -6176,7 +6176,7 @@ define void @mov_test18(i8 * %addr, <8 x i64> %data) { ; GENERIC-LABEL: mov_test18: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vmovaps %zmm0, (%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: mov_test18: @@ -6193,7 +6193,7 @@ define void @mov_test19(i8 * %addr, <16 x i32> %data) { ; GENERIC-LABEL: mov_test19: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vmovups %zmm0, (%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: mov_test19: @@ -6210,7 +6210,7 @@ define void @mov_test20(i8 * %addr, <16 x i32> %data) { ; GENERIC-LABEL: mov_test20: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vmovaps %zmm0, (%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: mov_test20: @@ -6242,7 +6242,7 @@ define void @mov_test22(i8 * %addr, <8 x i64> %data) { ; GENERIC-LABEL: mov_test22: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vmovups %zmm0, (%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: mov_test22: @@ -6274,7 +6274,7 @@ define void @mov_test24(i8 * %addr, <8 x double> %data) { ; GENERIC-LABEL: mov_test24: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vmovaps %zmm0, (%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: mov_test24: @@ -6306,7 +6306,7 @@ define void @mov_test26(i8 * %addr, <16 x float> %data) { ; GENERIC-LABEL: mov_test26: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vmovaps %zmm0, (%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: mov_test26: @@ -6338,7 +6338,7 @@ define void @mov_test28(i8 * %addr, <8 x double> %data) { ; GENERIC-LABEL: mov_test28: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vmovups %zmm0, (%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: mov_test28: @@ -6370,7 +6370,7 @@ define void @mov_test30(i8 * %addr, <16 x float> %data) { ; GENERIC-LABEL: mov_test30: ; GENERIC: # %bb.0: ; GENERIC-NEXT: vmovups %zmm0, (%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: mov_test30: @@ -6952,7 +6952,7 @@ define i32 @zext_test1(<16 x i32> %a, <16 x i32> %b) { ; GENERIC-NEXT: kshiftrw $15, %k0, %k0 # sched: [1:1.00] ; GENERIC-NEXT: kmovd %k0, %eax # sched: [1:0.33] ; GENERIC-NEXT: andl $1, %eax # sched: [1:0.33] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: zext_test1: @@ -6979,7 +6979,7 @@ define i16 @zext_test2(<16 x i32> %a, <16 x i32> %b) { ; GENERIC-NEXT: kmovd %k0, %eax # sched: [1:0.33] ; GENERIC-NEXT: andl $1, %eax # sched: [1:0.33] ; GENERIC-NEXT: # kill: def %ax killed %ax killed %eax -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: zext_test2: @@ -7007,7 +7007,7 @@ define i8 @zext_test3(<16 x i32> %a, <16 x i32> %b) { ; GENERIC-NEXT: kmovd %k0, %eax # sched: [1:0.33] ; GENERIC-NEXT: andb $1, %al # sched: [1:0.33] ; GENERIC-NEXT: # kill: def %al killed %al killed %eax -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: zext_test3: @@ -7059,7 +7059,7 @@ define <4 x i32> @test4(<4 x i64> %x, <4 x i64> %y, <4 x i64> %x1, <4 x i64> %y1 ; GENERIC-NEXT: vpcmpgtq %ymm3, %ymm2, %k1 # sched: [3:1.00] ; GENERIC-NEXT: kandnw %k0, %k1, %k0 # sched: [1:1.00] ; GENERIC-NEXT: vpmovm2d %k0, %xmm0 # sched: [1:0.33] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: test4: @@ -7152,12 +7152,12 @@ define <16 x i8> @vcmp_test8(<16 x i32>%a, <16 x i32>%b, i32 %a1, i32 %b1) { ; GENERIC-NEXT: # %bb.2: ; GENERIC-NEXT: vpcmpltud %zmm2, %zmm1, %k0 # sched: [3:1.00] ; GENERIC-NEXT: vpmovm2b %k0, %xmm0 # sched: [1:0.33] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; GENERIC-NEXT: .LBB386_1: ; GENERIC-NEXT: vpcmpgtd %zmm2, %zmm0, %k0 # sched: [3:1.00] ; GENERIC-NEXT: vpmovm2b %k0, %xmm0 # sched: [1:0.33] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: vcmp_test8: @@ -7711,11 +7711,11 @@ define void @ktest_1(<8 x double> %in, double * %base) { ; GENERIC-NEXT: je .LBB410_2 # sched: [1:1.00] ; GENERIC-NEXT: # %bb.1: # %L1 ; GENERIC-NEXT: vmovapd %zmm0, (%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; GENERIC-NEXT: .LBB410_2: # %L2 ; GENERIC-NEXT: vmovapd %zmm0, 8(%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: ktest_1: @@ -7781,12 +7781,12 @@ define void @ktest_2(<32 x float> %in, float * %base) { ; GENERIC-NEXT: # %bb.1: # %L1 ; GENERIC-NEXT: vmovaps %zmm0, (%rdi) # sched: [1:1.00] ; GENERIC-NEXT: vmovaps %zmm1, 64(%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; GENERIC-NEXT: .LBB411_2: # %L2 ; GENERIC-NEXT: vmovaps %zmm0, 4(%rdi) # sched: [1:1.00] ; GENERIC-NEXT: vmovaps %zmm1, 68(%rdi) # sched: [1:1.00] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: ktest_2: @@ -8004,7 +8004,7 @@ define void @store_32i1(<32 x i1>* %a, <32 x i1> %v) { ; GENERIC-NEXT: vpsllw $7, %ymm0, %ymm0 # sched: [1:1.00] ; GENERIC-NEXT: vpmovb2m %ymm0, %k0 # sched: [1:0.33] ; GENERIC-NEXT: kmovd %k0, (%rdi) -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: store_32i1: @@ -8024,7 +8024,7 @@ define void @store_32i1_1(<32 x i1>* %a, <32 x i16> %v) { ; GENERIC-NEXT: vpsllw $15, %zmm0, %zmm0 # sched: [3:1.00] ; GENERIC-NEXT: vpmovw2m %zmm0, %k0 # sched: [1:0.33] ; GENERIC-NEXT: kmovd %k0, (%rdi) -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: store_32i1_1: @@ -8047,7 +8047,7 @@ define void @store_64i1(<64 x i1>* %a, <64 x i1> %v) { ; GENERIC-NEXT: vpsllw $7, %zmm0, %zmm0 # sched: [3:1.00] ; GENERIC-NEXT: vpmovb2m %zmm0, %k0 # sched: [1:0.33] ; GENERIC-NEXT: kmovq %k0, (%rdi) -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: store_64i1: @@ -8068,7 +8068,7 @@ define i32 @test_bitcast_v8i1_zext(<16 x i32> %a) { ; GENERIC-NEXT: vpcmpeqd %zmm1, %zmm0, %k0 # sched: [3:1.00] ; GENERIC-NEXT: kmovb %k0, %eax # sched: [1:0.33] ; GENERIC-NEXT: addl %eax, %eax # sched: [1:0.33] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: test_bitcast_v8i1_zext: @@ -8094,7 +8094,7 @@ define i32 @test_bitcast_v16i1_zext(<16 x i32> %a) { ; GENERIC-NEXT: vpcmpeqd %zmm1, %zmm0, %k0 # sched: [3:1.00] ; GENERIC-NEXT: kmovw %k0, %eax # sched: [1:0.33] ; GENERIC-NEXT: addl %eax, %eax # sched: [1:0.33] -; GENERIC-NEXT: vzeroupper +; GENERIC-NEXT: vzeroupper # sched: [100:0.33] ; GENERIC-NEXT: retq # sched: [1:1.00] ; ; SKX-LABEL: test_bitcast_v16i1_zext: