Add test that verifies we don't peel loops in optsize functions. NFC.

author Michael Kuperstein <mkuper@google.com>

Wed, 11 Jan 2017 21:42:51 +0000 (21:42 +0000)

committer Michael Kuperstein <mkuper@google.com>

Wed, 11 Jan 2017 21:42:51 +0000 (21:42 +0000)
author Michael Kuperstein <mkuper@google.com>
Wed, 11 Jan 2017 21:42:51 +0000 (21:42 +0000)
committer Michael Kuperstein <mkuper@google.com>
Wed, 11 Jan 2017 21:42:51 +0000 (21:42 +0000)
diff --git a/test/Transforms/LoopUnroll/peel-loop-pgo.ll b/test/Transforms/LoopUnroll/peel-loop-pgo.ll

index 18309b0691fabbc4b875670406333eeda5ebe1be..a87d5643e7e9dcdf1fd7e618d6dea3f7cb0dd2f6 100644 (file)
--- a/test/Transforms/LoopUnroll/peel-loop-pgo.ll
+++ b/test/Transforms/LoopUnroll/peel-loop-pgo.ll
@@ -3,7 +3,12 @@
  
  ; Make sure we use the profile information correctly to peel-off 3 iterations
  ; from the loop, and update the branch weights for the peeled loop properly.
+
+; CHECK: Loop Unroll: F[basic]
  ; CHECK: PEELING loop %for.body with iteration count 3!
+; CHECK: Loop Unroll: F[optsize]
+; CHECK-NOT: PEELING
+
  ; CHECK-LABEL: @basic
  ; CHECK: br i1 %{{.*}}, label %[[NEXT0:.*]], label %for.cond.for.end_crit_edge, !prof !1
  ; CHECK: [[NEXT0]]:
@@ -37,6 +42,40 @@ for.end:                                          ; preds = %for.cond.for.end_cr
    ret void
  }
  
+; We don't want to peel loops when optimizing for size.
+; CHECK-LABEL: @optsize
+; CHECK: for.body.lr.ph:
+; CHECK-NEXT: br label %for.body
+; CHECK: for.body:
+; CHECK-NOT: br
+; CHECK: br i1 %cmp, label %for.body, label %for.cond.for.end_crit_edge
+define void @optsize(i32* %p, i32 %k) #1 !prof !0 {
+entry:
+  %cmp3 = icmp slt i32 0, %k
+  br i1 %cmp3, label %for.body.lr.ph, label %for.end
+
+for.body.lr.ph:                                   ; preds = %entry
+  br label %for.body
+
+for.body:                                         ; preds = %for.body.lr.ph, %for.body
+  %i.05 = phi i32 [ 0, %for.body.lr.ph ], [ %inc, %for.body ]
+  %p.addr.04 = phi i32* [ %p, %for.body.lr.ph ], [ %incdec.ptr, %for.body ]
+  %incdec.ptr = getelementptr inbounds i32, i32* %p.addr.04, i32 1
+  store i32 %i.05, i32* %p.addr.04, align 4
+  %inc = add nsw i32 %i.05, 1
+  %cmp = icmp slt i32 %inc, %k
+  br i1 %cmp, label %for.body, label %for.cond.for.end_crit_edge, !prof !1
+
+for.cond.for.end_crit_edge:                       ; preds = %for.body
+  br label %for.end
+
+for.end:                                          ; preds = %for.cond.for.end_crit_edge, %entry
+  ret void
+}
+
+attributes #0 = { nounwind }
+attributes #1 = { nounwind optsize }
+
  !0 = !{!"function_entry_count", i64 1}
  !1 = !{!"branch_weights", i32 3001, i32 1001}
author	Michael Kuperstein <mkuper@google.com>
	Wed, 11 Jan 2017 21:42:51 +0000 (21:42 +0000)
committer	Michael Kuperstein <mkuper@google.com>
	Wed, 11 Jan 2017 21:42:51 +0000 (21:42 +0000)