Skip to content

Commit 94c4952

Browse files
committed
[AArch64] Enable Upper bound unrolling universally
Differential Revision: https://reviews.llvm.org/D105996
1 parent 5b06cba commit 94c4952

File tree

2 files changed

+67
-1
lines changed

2 files changed

+67
-1
lines changed

llvm/lib/Target/AArch64/AArch64TargetTransformInfo.cpp

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1754,6 +1754,8 @@ void AArch64TTIImpl::getUnrollingPreferences(Loop *L, ScalarEvolution &SE,
17541754
// Enable partial unrolling and runtime unrolling.
17551755
BaseT::getUnrollingPreferences(L, SE, UP, ORE);
17561756

1757+
UP.UpperBound = true;
1758+
17571759
// For inner loop, it is more likely to be a hot one, and the runtime check
17581760
// can be promoted out from LICM pass, so the overhead is less, let's try
17591761
// a larger threshold to unroll more loops.
@@ -1794,7 +1796,6 @@ void AArch64TTIImpl::getUnrollingPreferences(Loop *L, ScalarEvolution &SE,
17941796
!ST->getSchedModel().isOutOfOrder()) {
17951797
UP.Runtime = true;
17961798
UP.Partial = true;
1797-
UP.UpperBound = true;
17981799
UP.UnrollRemainder = true;
17991800
UP.DefaultUnrollRuntimeCount = 4;
18001801

Lines changed: 65 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,65 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2+
; RUN: opt < %s -S -loop-unroll -mtriple aarch64 | FileCheck %s
3+
4+
; Below loop's trip count is not constant and it blocks to unroll the loop.
5+
; After setting up `UP.UpperBound = true` in `getUnrollingPreferences`,
6+
; the loop should be unrolled.
7+
8+
define void @test(i1 %cond) {
9+
; CHECK-LABEL: @test(
10+
; CHECK-NEXT: entry:
11+
; CHECK-NEXT: br label [[FOR_BODY:%.*]]
12+
; CHECK: for.body:
13+
; CHECK-NEXT: switch i32 0, label [[SW_DEFAULT:%.*]] [
14+
; CHECK-NEXT: i32 2, label [[LATCH:%.*]]
15+
; CHECK-NEXT: ]
16+
; CHECK: sw.default:
17+
; CHECK-NEXT: tail call void @foo()
18+
; CHECK-NEXT: br label [[LATCH]]
19+
; CHECK: latch:
20+
; CHECK-NEXT: br i1 false, label [[FOR_END:%.*]], label [[FOR_BODY_1:%.*]]
21+
; CHECK: for.end:
22+
; CHECK-NEXT: ret void
23+
; CHECK: for.body.1:
24+
; CHECK-NEXT: switch i32 1, label [[SW_DEFAULT_1:%.*]] [
25+
; CHECK-NEXT: i32 2, label [[LATCH_1:%.*]]
26+
; CHECK-NEXT: ]
27+
; CHECK: sw.default.1:
28+
; CHECK-NEXT: tail call void @foo()
29+
; CHECK-NEXT: br label [[LATCH_1]]
30+
; CHECK: latch.1:
31+
; CHECK-NEXT: br i1 [[COND:%.*]], label [[FOR_END]], label [[FOR_BODY_2:%.*]]
32+
; CHECK: for.body.2:
33+
; CHECK-NEXT: switch i32 2, label [[SW_DEFAULT_2:%.*]] [
34+
; CHECK-NEXT: i32 2, label [[LATCH_2:%.*]]
35+
; CHECK-NEXT: ]
36+
; CHECK: sw.default.2:
37+
; CHECK-NEXT: tail call void @foo()
38+
; CHECK-NEXT: br label [[LATCH_2]]
39+
; CHECK: latch.2:
40+
; CHECK-NEXT: br label [[FOR_END]]
41+
;
42+
entry:
43+
%0 = select i1 %cond, i32 2, i32 3
44+
br label %for.body
45+
46+
for.body:
47+
%i.017 = phi i32 [ 0, %entry ], [ %inc, %latch ]
48+
switch i32 %i.017, label %sw.default [
49+
i32 2, label %latch
50+
]
51+
52+
sw.default:
53+
tail call void @foo()
54+
br label %latch
55+
56+
latch:
57+
%inc = add nuw nsw i32 %i.017, 1
58+
%exitcond.not = icmp eq i32 %inc, %0
59+
br i1 %exitcond.not, label %for.end, label %for.body
60+
61+
for.end:
62+
ret void
63+
}
64+
65+
declare void @foo()

0 commit comments

Comments
 (0)