| ; RUN: opt < %s -S -loop-unroll -unroll-count=4 | FileCheck -check-prefix=CHECK_COUNT4 %s | |
| ; RUN: opt < %s -S -loop-unroll | FileCheck -check-prefix=CHECK_NOCOUNT %s | |
| ; RUN: opt < %s -S -passes='require<profile-summary>,function(unroll)' -pgso | FileCheck -check-prefix=PGSO %s | |
| ; RUN: opt < %s -S -passes='require<profile-summary>,function(unroll)' -pgso=false | FileCheck -check-prefix=NPGSO %s | |
| ;///////////////////// TEST 1 ////////////////////////////// | |
| ; This test shows that the loop is unrolled according to the specified | |
| ; unroll factor. | |
| define void @Test1() nounwind { | |
| entry: | |
| br label %loop | |
| loop: | |
| %iv = phi i32 [ 0, %entry ], [ %inc, %loop ] | |
| %inc = add i32 %iv, 1 | |
| %exitcnd = icmp uge i32 %inc, 1024 | |
| br i1 %exitcnd, label %exit, label %loop | |
| exit: | |
| ret void | |
| } | |
| ; CHECK_COUNT4-LABEL: @Test1 | |
| ; CHECK_COUNT4: phi | |
| ; CHECK_COUNT4-NEXT: add | |
| ; CHECK_COUNT4-NEXT: add | |
| ; CHECK_COUNT4-NEXT: add | |
| ; CHECK_COUNT4-NEXT: add | |
| ; CHECK_COUNT4-NEXT: icmp | |
| ;///////////////////// TEST 2 ////////////////////////////// | |
| ; This test shows that with optnone attribute, the loop is not unrolled | |
| ; even if an unroll factor was specified. | |
| define void @Test2() nounwind optnone noinline { | |
| entry: | |
| br label %loop | |
| loop: | |
| %iv = phi i32 [ 0, %entry ], [ %inc, %loop ] | |
| %inc = add i32 %iv, 1 | |
| %exitcnd = icmp uge i32 %inc, 1024 | |
| br i1 %exitcnd, label %exit, label %loop | |
| exit: | |
| ret void | |
| } | |
| ; CHECK_COUNT4-LABEL: @Test2 | |
| ; CHECK_COUNT4: phi | |
| ; CHECK_COUNT4-NEXT: add | |
| ; CHECK_COUNT4-NEXT: icmp | |
| ;///////////////////// TEST 3 ////////////////////////////// | |
| ; This test shows that this loop is fully unrolled by default. | |
| @tab = common global [24 x i32] zeroinitializer, align 4 | |
| define i32 @Test3() { | |
| entry: | |
| br label %for.body | |
| for.body: ; preds = %for.body, %entry | |
| %i.05 = phi i32 [ 0, %entry ], [ %inc, %for.body ] | |
| %arrayidx = getelementptr inbounds [24 x i32], [24 x i32]* @tab, i32 0, i32 %i.05 | |
| store i32 %i.05, i32* %arrayidx, align 4 | |
| %inc = add nuw nsw i32 %i.05, 1 | |
| %exitcond = icmp eq i32 %inc, 24 | |
| br i1 %exitcond, label %for.end, label %for.body | |
| for.end: ; preds = %for.body | |
| ret i32 42 | |
| } | |
| ; CHECK_NOCOUNT-LABEL: @Test3 | |
| ; CHECK_NOCOUNT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: store | |
| ; CHECK_NOCOUNT-NEXT: ret | |
| ;///////////////////// TEST 4 ////////////////////////////// | |
| ; This test shows that with optsize attribute, this loop is not unrolled. | |
| define i32 @Test4() optsize { | |
| entry: | |
| br label %for.body | |
| for.body: ; preds = %for.body, %entry | |
| %i.05 = phi i32 [ 0, %entry ], [ %inc, %for.body ] | |
| %arrayidx = getelementptr inbounds [24 x i32], [24 x i32]* @tab, i32 0, i32 %i.05 | |
| store i32 %i.05, i32* %arrayidx, align 4 | |
| %inc = add nuw nsw i32 %i.05, 1 | |
| %exitcond = icmp eq i32 %inc, 24 | |
| br i1 %exitcond, label %for.end, label %for.body | |
| for.end: ; preds = %for.body | |
| ret i32 42 | |
| } | |
| ; CHECK_NOCOUNT-LABEL: @Test4 | |
| ; CHECK_NOCOUNT: phi | |
| ; CHECK_NOCOUNT: icmp | |
| ;///////////////////// TEST 5 ////////////////////////////// | |
| ; This test shows that with PGO, this loop is cold and not unrolled. | |
| define i32 @Test5() !prof !14 { | |
| entry: | |
| br label %for.body | |
| for.body: ; preds = %for.body, %entry | |
| %i.05 = phi i32 [ 0, %entry ], [ %inc, %for.body ] | |
| %arrayidx = getelementptr inbounds [24 x i32], [24 x i32]* @tab, i32 0, i32 %i.05 | |
| store i32 %i.05, i32* %arrayidx, align 4 | |
| %inc = add nuw nsw i32 %i.05, 1 | |
| %exitcond = icmp eq i32 %inc, 24 | |
| br i1 %exitcond, label %for.end, label %for.body | |
| for.end: ; preds = %for.body | |
| ret i32 42 | |
| } | |
| ; PGSO-LABEL: @Test5 | |
| ; PGSO: phi | |
| ; PGSO: icmp | |
| ; NPGSO-LABEL: @Test5 | |
| ; NPGSO-NOT: phi | |
| ; NPGSO-NOT: icmp | |
| !llvm.module.flags = !{!0} | |
| !0 = !{i32 1, !"ProfileSummary", !1} | |
| !1 = !{!2, !3, !4, !5, !6, !7, !8, !9} | |
| !2 = !{!"ProfileFormat", !"InstrProf"} | |
| !3 = !{!"TotalCount", i64 10000} | |
| !4 = !{!"MaxCount", i64 10} | |
| !5 = !{!"MaxInternalCount", i64 1} | |
| !6 = !{!"MaxFunctionCount", i64 1000} | |
| !7 = !{!"NumCounts", i64 3} | |
| !8 = !{!"NumFunctions", i64 3} | |
| !9 = !{!"DetailedSummary", !10} | |
| !10 = !{!11, !12, !13} | |
| !11 = !{i32 10000, i64 100, i32 1} | |
| !12 = !{i32 999000, i64 100, i32 1} | |
| !13 = !{i32 999999, i64 1, i32 2} | |
| !14 = !{!"function_entry_count", i64 0} |