-; RUN: llc -mtriple=x86_64-linux -mcpu=corei7 < %s | FileCheck %s
+; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
+; RUN: llc < %s -mtriple=x86_64-linux -mcpu=corei7 | FileCheck %s
+
; This tests the fix for a missing case in the MI scheduler's
; constrainLocalCopy, exposed by PR21792.
@stuff = external constant [256 x double], align 16
define void @func(<4 x float> %vx) {
+; CHECK-LABEL: func:
+; CHECK: # BB#0: # %entry
+; CHECK-NEXT: pushq %rax
+; CHECK-NEXT: .Lcfi0:
+; CHECK-NEXT: .cfi_def_cfa_offset 16
+; CHECK-NEXT: pand {{.*}}(%rip), %xmm0
+; CHECK-NEXT: pextrq $1, %xmm0, %rcx
+; CHECK-NEXT: movd %xmm0, %rax
+; CHECK-NEXT: movq %rax, %r9
+; CHECK-NEXT: shrq $32, %r9
+; CHECK-NEXT: andl $2032, %eax # imm = 0x7F0
+; CHECK-NEXT: leaq stuff(%rax), %rdi
+; CHECK-NEXT: leaq stuff(%r9), %rsi
+; CHECK-NEXT: movl %ecx, %edx
+; CHECK-NEXT: andl $2032, %edx # imm = 0x7F0
+; CHECK-NEXT: leaq stuff(%rdx), %rdx
+; CHECK-NEXT: sarq $32, %rcx
+; CHECK-NEXT: leaq stuff(%rcx), %rcx
+; CHECK-NEXT: leaq stuff+8(%rax), %r8
+; CHECK-NEXT: leaq stuff+8(%r9), %r9
+; CHECK-NEXT: callq toto
+; CHECK-NEXT: popq %rax
+; CHECK-NEXT: retq
entry:
%tmp2 = bitcast <4 x float> %vx to <2 x i64>
%and.i = and <2 x i64> %tmp2, <i64 8727373547504, i64 8727373547504>
%tmp17 = bitcast i8* %add.ptr51 to double*
call void @toto(double* %tmp4, double* %tmp5, double* %tmp6, double* %tmp7, double* %tmp16, double* %tmp17)
ret void
-; CHECK-LABEL: func:
-; CHECK: pextrq $1, %xmm0,
-; CHECK-NEXT: movd %xmm0, %r[[AX:..]]
-; CHECK-NEXT: movq %r[[AX]],
-; CHECK-NEXT: shrq $32, %r9
}
declare void @toto(double*, double*, double*, double*, double*, double*)