Skip to content

Commit 9f77e96

Browse files
nikictru
authored andcommitted
[GVN] Invalidate MDA when deduplicating phi nodes
Duplicate phi nodes were being directly removed, without invalidating MDA. This could result in a new phi node being allocated at the same address, incorrectly reusing a cache entry. Fix this by optionally allowing EliminateDuplicatePHINodes() to collect phi nodes to remove into a vector, which allows GVN to handle removal itself. Fixes llvm#64598. Differential Revision: https://reviews.llvm.org/D158849 (cherry picked from commit 7c229f6)
1 parent a13a894 commit 9f77e96

File tree

4 files changed

+141
-8
lines changed

4 files changed

+141
-8
lines changed

llvm/include/llvm/Transforms/Utils/Local.h

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -162,8 +162,18 @@ bool TryToSimplifyUncondBranchFromEmptyBlock(BasicBlock *BB,
162162
/// Check for and eliminate duplicate PHI nodes in this block. This doesn't try
163163
/// to be clever about PHI nodes which differ only in the order of the incoming
164164
/// values, but instcombine orders them so it usually won't matter.
165+
///
166+
/// This overload removes the duplicate PHI nodes directly.
165167
bool EliminateDuplicatePHINodes(BasicBlock *BB);
166168

169+
/// Check for and eliminate duplicate PHI nodes in this block. This doesn't try
170+
/// to be clever about PHI nodes which differ only in the order of the incoming
171+
/// values, but instcombine orders them so it usually won't matter.
172+
///
173+
/// This overload collects the PHI nodes to be removed into the ToRemove set.
174+
bool EliminateDuplicatePHINodes(BasicBlock *BB,
175+
SmallPtrSetImpl<PHINode *> &ToRemove);
176+
167177
/// This function is used to do simplification of a CFG. For example, it
168178
/// adjusts branches to branches to eliminate the extra hop, it eliminates
169179
/// unreachable basic blocks, and does other peephole optimization of the CFG.

llvm/lib/Transforms/Scalar/GVN.cpp

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2778,7 +2778,10 @@ bool GVNPass::processBlock(BasicBlock *BB) {
27782778
// use our normal hash approach for phis. Instead, simply look for
27792779
// obvious duplicates. The first pass of GVN will tend to create
27802780
// identical phis, and the second or later passes can eliminate them.
2781-
ChangedFunction |= EliminateDuplicatePHINodes(BB);
2781+
SmallPtrSet<PHINode *, 8> PHINodesToRemove;
2782+
ChangedFunction |= EliminateDuplicatePHINodes(BB, PHINodesToRemove);
2783+
for (PHINode *PN : PHINodesToRemove)
2784+
removeInstruction(PN);
27822785

27832786
for (BasicBlock::iterator BI = BB->begin(), BE = BB->end();
27842787
BI != BE;) {

llvm/lib/Transforms/Utils/Local.cpp

Lines changed: 24 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -1247,7 +1247,9 @@ bool llvm::TryToSimplifyUncondBranchFromEmptyBlock(BasicBlock *BB,
12471247
return true;
12481248
}
12491249

1250-
static bool EliminateDuplicatePHINodesNaiveImpl(BasicBlock *BB) {
1250+
static bool
1251+
EliminateDuplicatePHINodesNaiveImpl(BasicBlock *BB,
1252+
SmallPtrSetImpl<PHINode *> &ToRemove) {
12511253
// This implementation doesn't currently consider undef operands
12521254
// specially. Theoretically, two phis which are identical except for
12531255
// one having an undef where the other doesn't could be collapsed.
@@ -1263,12 +1265,14 @@ static bool EliminateDuplicatePHINodesNaiveImpl(BasicBlock *BB) {
12631265
// Note that we only look in the upper square's triangle,
12641266
// we already checked that the lower triangle PHI's aren't identical.
12651267
for (auto J = I; PHINode *DuplicatePN = dyn_cast<PHINode>(J); ++J) {
1268+
if (ToRemove.contains(DuplicatePN))
1269+
continue;
12661270
if (!DuplicatePN->isIdenticalToWhenDefined(PN))
12671271
continue;
12681272
// A duplicate. Replace this PHI with the base PHI.
12691273
++NumPHICSEs;
12701274
DuplicatePN->replaceAllUsesWith(PN);
1271-
DuplicatePN->eraseFromParent();
1275+
ToRemove.insert(DuplicatePN);
12721276
Changed = true;
12731277

12741278
// The RAUW can change PHIs that we already visited.
@@ -1279,7 +1283,9 @@ static bool EliminateDuplicatePHINodesNaiveImpl(BasicBlock *BB) {
12791283
return Changed;
12801284
}
12811285

1282-
static bool EliminateDuplicatePHINodesSetBasedImpl(BasicBlock *BB) {
1286+
static bool
1287+
EliminateDuplicatePHINodesSetBasedImpl(BasicBlock *BB,
1288+
SmallPtrSetImpl<PHINode *> &ToRemove) {
12831289
// This implementation doesn't currently consider undef operands
12841290
// specially. Theoretically, two phis which are identical except for
12851291
// one having an undef where the other doesn't could be collapsed.
@@ -1343,12 +1349,14 @@ static bool EliminateDuplicatePHINodesSetBasedImpl(BasicBlock *BB) {
13431349
// Examine each PHI.
13441350
bool Changed = false;
13451351
for (auto I = BB->begin(); PHINode *PN = dyn_cast<PHINode>(I++);) {
1352+
if (ToRemove.contains(PN))
1353+
continue;
13461354
auto Inserted = PHISet.insert(PN);
13471355
if (!Inserted.second) {
13481356
// A duplicate. Replace this PHI with its duplicate.
13491357
++NumPHICSEs;
13501358
PN->replaceAllUsesWith(*Inserted.first);
1351-
PN->eraseFromParent();
1359+
ToRemove.insert(PN);
13521360
Changed = true;
13531361

13541362
// The RAUW can change PHIs that we already visited. Start over from the
@@ -1361,14 +1369,23 @@ static bool EliminateDuplicatePHINodesSetBasedImpl(BasicBlock *BB) {
13611369
return Changed;
13621370
}
13631371

1364-
bool llvm::EliminateDuplicatePHINodes(BasicBlock *BB) {
1372+
bool llvm::EliminateDuplicatePHINodes(BasicBlock *BB,
1373+
SmallPtrSetImpl<PHINode *> &ToRemove) {
13651374
if (
13661375
#ifndef NDEBUG
13671376
!PHICSEDebugHash &&
13681377
#endif
13691378
hasNItemsOrLess(BB->phis(), PHICSENumPHISmallSize))
1370-
return EliminateDuplicatePHINodesNaiveImpl(BB);
1371-
return EliminateDuplicatePHINodesSetBasedImpl(BB);
1379+
return EliminateDuplicatePHINodesNaiveImpl(BB, ToRemove);
1380+
return EliminateDuplicatePHINodesSetBasedImpl(BB, ToRemove);
1381+
}
1382+
1383+
bool llvm::EliminateDuplicatePHINodes(BasicBlock *BB) {
1384+
SmallPtrSet<PHINode *, 8> ToRemove;
1385+
bool Changed = EliminateDuplicatePHINodes(BB, ToRemove);
1386+
for (PHINode *PN : ToRemove)
1387+
PN->eraseFromParent();
1388+
return Changed;
13721389
}
13731390

13741391
/// If the specified pointer points to an object that we control, try to modify

llvm/test/Transforms/GVN/pr64598.ll

Lines changed: 103 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,103 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
2+
; RUN: opt -S -passes=gvn < %s | FileCheck %s
3+
4+
define i32 @main(i64 %x, ptr %d, ptr noalias %p) {
5+
; CHECK-LABEL: define i32 @main
6+
; CHECK-SAME: (i64 [[X:%.*]], ptr [[D:%.*]], ptr noalias [[P:%.*]]) {
7+
; CHECK-NEXT: entry:
8+
; CHECK-NEXT: [[T1_PRE_PRE_PRE:%.*]] = load ptr, ptr [[P]], align 8
9+
; CHECK-NEXT: [[T2_PRE_PRE_PRE:%.*]] = load ptr, ptr [[T1_PRE_PRE_PRE]], align 8, !tbaa [[TBAA0:![0-9]+]]
10+
; CHECK-NEXT: [[T3_PRE_PRE_PRE:%.*]] = load ptr, ptr [[T2_PRE_PRE_PRE]], align 8
11+
; CHECK-NEXT: br label [[LOOP:%.*]]
12+
; CHECK: loop:
13+
; CHECK-NEXT: [[T2_PRE_PRE:%.*]] = phi ptr [ [[T2_PRE_PRE23:%.*]], [[LOOP_LATCH:%.*]] ], [ [[T2_PRE_PRE_PRE]], [[ENTRY:%.*]] ]
14+
; CHECK-NEXT: [[T1_PRE_PRE:%.*]] = phi ptr [ [[T1_PRE_PRE19:%.*]], [[LOOP_LATCH]] ], [ [[T1_PRE_PRE_PRE]], [[ENTRY]] ]
15+
; CHECK-NEXT: br label [[LOOP2:%.*]]
16+
; CHECK: loop2:
17+
; CHECK-NEXT: [[T2_PRE_PRE25:%.*]] = phi ptr [ [[T2_PRE_PRE23]], [[LOOP2_LATCH_LOOP2_CRIT_EDGE:%.*]] ], [ [[T2_PRE_PRE]], [[LOOP]] ]
18+
; CHECK-NEXT: [[T1_PRE_PRE21:%.*]] = phi ptr [ [[T1_PRE_PRE19]], [[LOOP2_LATCH_LOOP2_CRIT_EDGE]] ], [ [[T1_PRE_PRE]], [[LOOP]] ]
19+
; CHECK-NEXT: [[T3_PRE:%.*]] = phi ptr [ [[T3_PRE16:%.*]], [[LOOP2_LATCH_LOOP2_CRIT_EDGE]] ], [ [[T3_PRE_PRE_PRE]], [[LOOP]] ]
20+
; CHECK-NEXT: [[T2_PRE:%.*]] = phi ptr [ [[T2_PRE13:%.*]], [[LOOP2_LATCH_LOOP2_CRIT_EDGE]] ], [ [[T2_PRE_PRE]], [[LOOP]] ]
21+
; CHECK-NEXT: [[T1_PRE:%.*]] = phi ptr [ [[T1_PRE10:%.*]], [[LOOP2_LATCH_LOOP2_CRIT_EDGE]] ], [ [[T1_PRE_PRE]], [[LOOP]] ]
22+
; CHECK-NEXT: br label [[LOOP3:%.*]]
23+
; CHECK: loop3:
24+
; CHECK-NEXT: [[T2_PRE_PRE24:%.*]] = phi ptr [ [[T2_PRE_PRE23]], [[LOOP3_LATCH:%.*]] ], [ [[T2_PRE_PRE25]], [[LOOP2]] ]
25+
; CHECK-NEXT: [[T1_PRE_PRE20:%.*]] = phi ptr [ [[T1_PRE_PRE19]], [[LOOP3_LATCH]] ], [ [[T1_PRE_PRE21]], [[LOOP2]] ]
26+
; CHECK-NEXT: [[T3_PRE17:%.*]] = phi ptr [ [[T3_PRE16]], [[LOOP3_LATCH]] ], [ [[T3_PRE]], [[LOOP2]] ]
27+
; CHECK-NEXT: [[T2_PRE14:%.*]] = phi ptr [ [[T2_PRE13]], [[LOOP3_LATCH]] ], [ [[T2_PRE]], [[LOOP2]] ]
28+
; CHECK-NEXT: [[T1_PRE11:%.*]] = phi ptr [ [[T1_PRE10]], [[LOOP3_LATCH]] ], [ [[T1_PRE]], [[LOOP2]] ]
29+
; CHECK-NEXT: [[T78:%.*]] = phi ptr [ [[T7:%.*]], [[LOOP3_LATCH]] ], [ [[T3_PRE]], [[LOOP2]] ]
30+
; CHECK-NEXT: [[T66:%.*]] = phi ptr [ [[T6:%.*]], [[LOOP3_LATCH]] ], [ [[T2_PRE]], [[LOOP2]] ]
31+
; CHECK-NEXT: [[T54:%.*]] = phi ptr [ [[T5:%.*]], [[LOOP3_LATCH]] ], [ [[T1_PRE]], [[LOOP2]] ]
32+
; CHECK-NEXT: [[TOBOOL_NOT2_I:%.*]] = icmp eq i64 [[X]], 0
33+
; CHECK-NEXT: br i1 false, label [[LOOP3_LOOP3_LATCH_CRIT_EDGE:%.*]], label [[FOR_BODY_LR_PH_I:%.*]]
34+
; CHECK: loop3.loop3.latch_crit_edge:
35+
; CHECK-NEXT: br label [[LOOP3_LATCH]]
36+
; CHECK: for.body.lr.ph.i:
37+
; CHECK-NEXT: store i32 0, ptr [[P]], align 4
38+
; CHECK-NEXT: [[T5_PRE:%.*]] = load ptr, ptr [[P]], align 8
39+
; CHECK-NEXT: [[T6_PRE:%.*]] = load ptr, ptr [[T5_PRE]], align 8, !tbaa [[TBAA0]]
40+
; CHECK-NEXT: [[T7_PRE:%.*]] = load ptr, ptr [[T6_PRE]], align 8
41+
; CHECK-NEXT: br label [[LOOP3_LATCH]]
42+
; CHECK: loop3.latch:
43+
; CHECK-NEXT: [[T2_PRE_PRE23]] = phi ptr [ [[T2_PRE_PRE24]], [[LOOP3_LOOP3_LATCH_CRIT_EDGE]] ], [ [[T6_PRE]], [[FOR_BODY_LR_PH_I]] ]
44+
; CHECK-NEXT: [[T1_PRE_PRE19]] = phi ptr [ [[T1_PRE_PRE20]], [[LOOP3_LOOP3_LATCH_CRIT_EDGE]] ], [ [[T5_PRE]], [[FOR_BODY_LR_PH_I]] ]
45+
; CHECK-NEXT: [[T3_PRE16]] = phi ptr [ [[T3_PRE17]], [[LOOP3_LOOP3_LATCH_CRIT_EDGE]] ], [ [[T7_PRE]], [[FOR_BODY_LR_PH_I]] ]
46+
; CHECK-NEXT: [[T2_PRE13]] = phi ptr [ [[T2_PRE14]], [[LOOP3_LOOP3_LATCH_CRIT_EDGE]] ], [ [[T6_PRE]], [[FOR_BODY_LR_PH_I]] ]
47+
; CHECK-NEXT: [[T1_PRE10]] = phi ptr [ [[T1_PRE11]], [[LOOP3_LOOP3_LATCH_CRIT_EDGE]] ], [ [[T5_PRE]], [[FOR_BODY_LR_PH_I]] ]
48+
; CHECK-NEXT: [[T7]] = phi ptr [ [[T78]], [[LOOP3_LOOP3_LATCH_CRIT_EDGE]] ], [ [[T7_PRE]], [[FOR_BODY_LR_PH_I]] ]
49+
; CHECK-NEXT: [[T6]] = phi ptr [ [[T66]], [[LOOP3_LOOP3_LATCH_CRIT_EDGE]] ], [ [[T6_PRE]], [[FOR_BODY_LR_PH_I]] ]
50+
; CHECK-NEXT: [[T5]] = phi ptr [ [[T54]], [[LOOP3_LOOP3_LATCH_CRIT_EDGE]] ], [ [[T5_PRE]], [[FOR_BODY_LR_PH_I]] ]
51+
; CHECK-NEXT: br i1 false, label [[LOOP2_LATCH:%.*]], label [[LOOP3]]
52+
; CHECK: loop2.latch:
53+
; CHECK-NEXT: br i1 false, label [[LOOP2_LATCH_LOOP2_CRIT_EDGE]], label [[LOOP_LATCH]]
54+
; CHECK: loop2.latch.loop2_crit_edge:
55+
; CHECK-NEXT: br label [[LOOP2]]
56+
; CHECK: loop.latch:
57+
; CHECK-NEXT: store i32 0, ptr [[D]], align 4, !tbaa [[TBAA4:![0-9]+]]
58+
; CHECK-NEXT: br label [[LOOP]]
59+
;
60+
entry:
61+
br label %loop
62+
63+
loop:
64+
br label %loop2
65+
66+
loop2:
67+
br label %loop3
68+
69+
loop3:
70+
%t1 = load ptr, ptr %p, align 8
71+
%t2 = load ptr, ptr %t1, align 8, !tbaa !0
72+
%t3 = load ptr, ptr %t2, align 8
73+
%t4 = load i8, ptr %t3, align 1
74+
%tobool.not2.i = icmp eq i64 %x, 0
75+
br i1 false, label %loop3.latch, label %for.body.lr.ph.i
76+
77+
for.body.lr.ph.i:
78+
store i32 0, ptr %p, align 4
79+
br label %w.exit.loopexit
80+
81+
w.exit.loopexit:
82+
br label %loop3.latch
83+
84+
loop3.latch:
85+
%t5 = load ptr, ptr %p, align 8
86+
%t6 = load ptr, ptr %t5, align 8, !tbaa !0
87+
%t7 = load ptr, ptr %t6, align 8
88+
br i1 false, label %loop2.latch, label %loop3
89+
90+
loop2.latch:
91+
br i1 false, label %loop2, label %loop.latch
92+
93+
loop.latch:
94+
store i32 0, ptr %d, align 4, !tbaa !4
95+
br label %loop
96+
}
97+
98+
!0 = !{!1, !1, i64 0}
99+
!1 = !{!"any pointer", !2, i64 0}
100+
!2 = !{!"omnipotent char", !3, i64 0}
101+
!3 = !{!"Simple C/C++ TBAA"}
102+
!4 = !{!5, !5, i64 0}
103+
!5 = !{!"int", !2, i64 0}

0 commit comments

Comments
 (0)