Skip to content

Commit 5bcc82d

Browse files
committed
[LoopPeel] Fix LCSSA phi node invalidation
In the test case, the backedge-taken count (BECount) of the second loop uses %load, but we only have an LCSSA phi node for %add, so only that phi node gets invalidated by forgetValue(). Use the forgetLcssaPhiWithNewPredecessor() API instead, which invalidates the roots of the expression. Fixes #109333.
1 parent c498af7 commit 5bcc82d

File tree

2 files changed

+105
-1
lines changed

2 files changed

+105
-1
lines changed

llvm/lib/Transforms/Utils/LoopPeel.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -859,7 +859,7 @@ static void cloneLoopBlocks(
859859
if (LatchInst && L->contains(LatchInst))
860860
LatchVal = VMap[LatchVal];
861861
PHI.addIncoming(LatchVal, cast<BasicBlock>(VMap[Edge.first]));
862-
SE.forgetValue(&PHI);
862+
SE.forgetLcssaPhiWithNewPredecessor(L, &PHI);
863863
}
864864

865865
// LastValueMap is updated with the values for the current loop
Lines changed: 104 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,104 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2+
; RUN: opt -S -passes="print<scalar-evolution>,loop-unroll" -unroll-runtime < %s 2>/dev/null | FileCheck %s
3+
4+
; Make sure we use %add.lcssa rather than %load when expanding the
5+
; backedge taken count.
6+
7+
define void @test(i1 %c, ptr %p) {
8+
; CHECK-LABEL: define void @test(
9+
; CHECK-SAME: i1 [[C:%.*]], ptr [[P:%.*]]) {
10+
; CHECK-NEXT: [[ENTRY:.*:]]
11+
; CHECK-NEXT: br label %[[LOOP_1_PEEL_BEGIN:.*]]
12+
; CHECK: [[LOOP_1_PEEL_BEGIN]]:
13+
; CHECK-NEXT: br label %[[LOOP_1_PEEL:.*]]
14+
; CHECK: [[LOOP_1_PEEL]]:
15+
; CHECK-NEXT: [[LOAD_PEEL:%.*]] = load i64, ptr [[P]], align 8
16+
; CHECK-NEXT: [[ADD_PEEL:%.*]] = add i64 [[LOAD_PEEL]], 1
17+
; CHECK-NEXT: br i1 [[C]], label %[[IF:.*]], label %[[LOOP_1_PEEL_NEXT:.*]]
18+
; CHECK: [[LOOP_1_PEEL_NEXT]]:
19+
; CHECK-NEXT: br label %[[LOOP_1_PEEL_NEXT1:.*]]
20+
; CHECK: [[LOOP_1_PEEL_NEXT1]]:
21+
; CHECK-NEXT: br label %[[ENTRY_PEEL_NEWPH:.*]]
22+
; CHECK: [[ENTRY_PEEL_NEWPH]]:
23+
; CHECK-NEXT: br label %[[LOOP_1:.*]]
24+
; CHECK: [[LOOP_1]]:
25+
; CHECK-NEXT: [[LOAD:%.*]] = load i64, ptr [[P]], align 8
26+
; CHECK-NEXT: [[ADD:%.*]] = add i64 [[LOAD]], 1
27+
; CHECK-NEXT: br i1 [[C]], label %[[IF_LOOPEXIT:.*]], label %[[LOOP_1]], !llvm.loop [[LOOP0:![0-9]+]]
28+
; CHECK: [[IF_LOOPEXIT]]:
29+
; CHECK-NEXT: [[ADD_LCSSA_PH:%.*]] = phi i64 [ [[ADD]], %[[LOOP_1]] ]
30+
; CHECK-NEXT: br label %[[IF]]
31+
; CHECK: [[IF]]:
32+
; CHECK-NEXT: [[ADD_LCSSA:%.*]] = phi i64 [ [[ADD_PEEL]], %[[LOOP_1_PEEL]] ], [ [[ADD_LCSSA_PH]], %[[IF_LOOPEXIT]] ]
33+
; CHECK-NEXT: [[GEP:%.*]] = getelementptr i64, ptr [[P]], i64 [[ADD_LCSSA]]
34+
; CHECK-NEXT: [[TMP0:%.*]] = shl i64 [[ADD_LCSSA]], 3
35+
; CHECK-NEXT: [[TMP1:%.*]] = lshr i64 [[TMP0]], 3
36+
; CHECK-NEXT: [[TMP2:%.*]] = add nuw nsw i64 [[TMP1]], 1
37+
; CHECK-NEXT: [[XTRAITER:%.*]] = and i64 [[TMP2]], 7
38+
; CHECK-NEXT: [[LCMP_MOD:%.*]] = icmp ne i64 [[XTRAITER]], 0
39+
; CHECK-NEXT: br i1 [[LCMP_MOD]], label %[[LOOP_2_PROL_PREHEADER:.*]], label %[[LOOP_2_PROL_LOOPEXIT:.*]]
40+
; CHECK: [[LOOP_2_PROL_PREHEADER]]:
41+
; CHECK-NEXT: br label %[[LOOP_2_PROL:.*]]
42+
; CHECK: [[LOOP_2_PROL]]:
43+
; CHECK-NEXT: [[IV_PROL:%.*]] = phi ptr [ [[P]], %[[LOOP_2_PROL_PREHEADER]] ], [ [[IV_NEXT_PROL:%.*]], %[[LOOP_2_PROL]] ]
44+
; CHECK-NEXT: [[PROL_ITER:%.*]] = phi i64 [ 0, %[[LOOP_2_PROL_PREHEADER]] ], [ [[PROL_ITER_NEXT:%.*]], %[[LOOP_2_PROL]] ]
45+
; CHECK-NEXT: [[IV_NEXT_PROL]] = getelementptr i8, ptr [[IV_PROL]], i64 8
46+
; CHECK-NEXT: [[ICMP_PROL:%.*]] = icmp eq ptr [[IV_PROL]], [[GEP]]
47+
; CHECK-NEXT: [[PROL_ITER_NEXT]] = add i64 [[PROL_ITER]], 1
48+
; CHECK-NEXT: [[PROL_ITER_CMP:%.*]] = icmp ne i64 [[PROL_ITER_NEXT]], [[XTRAITER]]
49+
; CHECK-NEXT: br i1 [[PROL_ITER_CMP]], label %[[LOOP_2_PROL]], label %[[LOOP_2_PROL_LOOPEXIT_UNR_LCSSA:.*]], !llvm.loop [[LOOP2:![0-9]+]]
50+
; CHECK: [[LOOP_2_PROL_LOOPEXIT_UNR_LCSSA]]:
51+
; CHECK-NEXT: [[IV_UNR_PH:%.*]] = phi ptr [ [[IV_NEXT_PROL]], %[[LOOP_2_PROL]] ]
52+
; CHECK-NEXT: br label %[[LOOP_2_PROL_LOOPEXIT]]
53+
; CHECK: [[LOOP_2_PROL_LOOPEXIT]]:
54+
; CHECK-NEXT: [[IV_UNR:%.*]] = phi ptr [ [[P]], %[[IF]] ], [ [[IV_UNR_PH]], %[[LOOP_2_PROL_LOOPEXIT_UNR_LCSSA]] ]
55+
; CHECK-NEXT: [[TMP3:%.*]] = icmp ult i64 [[TMP1]], 7
56+
; CHECK-NEXT: br i1 [[TMP3]], label %[[EXIT:.*]], label %[[IF_NEW:.*]]
57+
; CHECK: [[IF_NEW]]:
58+
; CHECK-NEXT: br label %[[LOOP_2:.*]]
59+
; CHECK: [[LOOP_2]]:
60+
; CHECK-NEXT: [[IV:%.*]] = phi ptr [ [[IV_UNR]], %[[IF_NEW]] ], [ [[IV_NEXT_7:%.*]], %[[LOOP_2]] ]
61+
; CHECK-NEXT: [[IV_NEXT:%.*]] = getelementptr i8, ptr [[IV]], i64 8
62+
; CHECK-NEXT: [[IV_NEXT_1:%.*]] = getelementptr i8, ptr [[IV_NEXT]], i64 8
63+
; CHECK-NEXT: [[IV_NEXT_2:%.*]] = getelementptr i8, ptr [[IV_NEXT_1]], i64 8
64+
; CHECK-NEXT: [[IV_NEXT_3:%.*]] = getelementptr i8, ptr [[IV_NEXT_2]], i64 8
65+
; CHECK-NEXT: [[IV_NEXT_4:%.*]] = getelementptr i8, ptr [[IV_NEXT_3]], i64 8
66+
; CHECK-NEXT: [[IV_NEXT_5:%.*]] = getelementptr i8, ptr [[IV_NEXT_4]], i64 8
67+
; CHECK-NEXT: [[IV_NEXT_6:%.*]] = getelementptr i8, ptr [[IV_NEXT_5]], i64 8
68+
; CHECK-NEXT: [[IV_NEXT_7]] = getelementptr i8, ptr [[IV_NEXT_6]], i64 8
69+
; CHECK-NEXT: [[ICMP_7:%.*]] = icmp eq ptr [[IV_NEXT_6]], [[GEP]]
70+
; CHECK-NEXT: br i1 [[ICMP_7]], label %[[EXIT_UNR_LCSSA:.*]], label %[[LOOP_2]]
71+
; CHECK: [[EXIT_UNR_LCSSA]]:
72+
; CHECK-NEXT: br label %[[EXIT]]
73+
; CHECK: [[EXIT]]:
74+
; CHECK-NEXT: ret void
75+
;
76+
entry:
77+
br label %loop.1
78+
79+
loop.1:
80+
%phi = phi ptr [ null, %entry ], [ %p, %loop.1 ]
81+
%load = load i64, ptr %p, align 8
82+
%add = add i64 %load, 1
83+
br i1 %c, label %if, label %loop.1
84+
85+
if:
86+
%add.lcssa = phi i64 [ %add, %loop.1 ]
87+
%gep = getelementptr i64, ptr %p, i64 %add.lcssa
88+
br label %loop.2
89+
90+
loop.2:
91+
%iv = phi ptr [ %p, %if ], [ %iv.next, %loop.2 ]
92+
%iv.next = getelementptr i8, ptr %iv, i64 8
93+
%icmp = icmp eq ptr %iv, %gep
94+
br i1 %icmp, label %exit, label %loop.2
95+
96+
exit:
97+
ret void
98+
}
99+
;.
100+
; CHECK: [[LOOP0]] = distinct !{[[LOOP0]], [[META1:![0-9]+]]}
101+
; CHECK: [[META1]] = !{!"llvm.loop.peeled.count", i32 1}
102+
; CHECK: [[LOOP2]] = distinct !{[[LOOP2]], [[META3:![0-9]+]]}
103+
; CHECK: [[META3]] = !{!"llvm.loop.unroll.disable"}
104+
;.

0 commit comments

Comments
 (0)