Skip to content

Commit 1fbdbb5

Browse files
committed
Revert "Recommit "[SCEV] Look through single value PHIs." (take 2)"
This reverts commit 764d9aa. The reverted patch exposed a few additional cases where SCEV expressions are not properly invalidated; see PR52024 and PR52023.
1 parent d81723c commit 1fbdbb5

File tree

8 files changed

+72
-60
lines changed

8 files changed

+72
-60
lines changed

llvm/lib/Analysis/ScalarEvolution.cpp

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5631,8 +5631,13 @@ const SCEV *ScalarEvolution::createNodeForPHI(PHINode *PN) {
56315631
if (const SCEV *S = createNodeFromSelectLikePHI(PN))
56325632
return S;
56335633

5634+
// If the PHI has a single incoming value, follow that value, unless the
5635+
// PHI's incoming blocks are in a different loop, in which case doing so
5636+
// risks breaking LCSSA form. Instcombine would normally zap these, but
5637+
// it doesn't have DominatorTree information, so it may miss cases.
56345638
if (Value *V = SimplifyInstruction(PN, {getDataLayout(), &TLI, &DT, &AC}))
5635-
return getSCEV(V);
5639+
if (LI.replacementPreservesLCSSAForm(PN, V))
5640+
return getSCEV(V);
56365641

56375642
// If it's not a loop phi, we can't handle it yet.
56385643
return getUnknown(PN);

llvm/test/Analysis/DependenceAnalysis/lcssa.ll

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
22
; RUN: "-aa-pipeline=basic-aa,tbaa" 2>&1 | FileCheck %s
33

44
; CHECK: Src: %v = load i32, i32* %arrayidx1, align 4 --> Dst: store i32 %add, i32* %a.lcssa, align 4
5-
; CHECK-NEXT: da analyze - anti [*|<]!
5+
; CHECK-NEXT: da analyze - confused!
66

77
define void @f(i32 *%a, i32 %n, i64 %n2) {
88
entry:

llvm/test/Analysis/ScalarEvolution/cycled_phis.ll

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -46,7 +46,7 @@ define void @test_02(i32* %p, i32* %q) {
4646
; CHECK-NEXT: %inner_cond = call i1 @cond()
4747
; CHECK-NEXT: --> %inner_cond U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %inner_loop: Variant, %outer_loop: Variant }
4848
; CHECK-NEXT: %inner_lcssa = phi i32 [ %inner_phi, %inner_loop ]
49-
; CHECK-NEXT: --> %inner_phi U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %outer_loop: Variant, %inner_loop: Variant }
49+
; CHECK-NEXT: --> %inner_lcssa U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %outer_loop: Variant, %inner_loop: Invariant }
5050
; CHECK-NEXT: %outer_cond = call i1 @cond()
5151
; CHECK-NEXT: --> %outer_cond U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %outer_loop: Variant, %inner_loop: Invariant }
5252
; CHECK-NEXT: Determining loop execution counts for: @test_02
@@ -97,7 +97,7 @@ define void @test_03(i32* %p, i32* %q) {
9797
; CHECK-NEXT: %inner_cond = call i1 @cond()
9898
; CHECK-NEXT: --> %inner_cond U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %inner_loop: Variant, %outer_loop: Variant }
9999
; CHECK-NEXT: %inner_lcssa = phi i32 [ %inner_phi_1, %inner_loop ]
100-
; CHECK-NEXT: --> %inner_phi_1 U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %outer_loop: Variant, %inner_loop: Variant }
100+
; CHECK-NEXT: --> %inner_lcssa U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %outer_loop: Variant, %inner_loop: Invariant }
101101
; CHECK-NEXT: %outer_cond = call i1 @cond()
102102
; CHECK-NEXT: --> %outer_cond U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %outer_loop: Variant, %inner_loop: Invariant }
103103
; CHECK-NEXT: Determining loop execution counts for: @test_03

llvm/test/Analysis/ScalarEvolution/incorrect-exit-count.ll

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -53,7 +53,7 @@ define dso_local i32 @f() {
5353
; CHECK-NEXT: %dec.3 = add nsw i32 %storemerge1921.3, -1
5454
; CHECK-NEXT: --> {2,+,-1}<nsw><%inner.loop> U: [2,3) S: [2,3) Exits: <<Unknown>> LoopDispositions: { %inner.loop: Computable, %outer.loop: Variant }
5555
; CHECK-NEXT: %storemerge1921.lcssa25.3 = phi i32 [ %storemerge1921.3, %for.end.3 ]
56-
; CHECK-NEXT: --> {3,+,-1}<nuw><nsw><%inner.loop> U: [3,4) S: [3,4) Exits: <<Unknown>> LoopDispositions: { %outer.loop: Variant, %for.cond6: Variant, %inner.loop: Computable }
56+
; CHECK-NEXT: --> %storemerge1921.lcssa25.3 U: [3,4) S: [3,4) Exits: <<Unknown>> LoopDispositions: { %outer.loop: Variant, %for.cond6: Invariant, %inner.loop: Invariant }
5757
; CHECK-NEXT: %dec16 = add nsw i32 %storemerge23, -1
5858
; CHECK-NEXT: --> {2,+,-1}<nsw><%outer.loop> U: [0,3) S: [0,3) Exits: <<Unknown>> LoopDispositions: { %outer.loop: Computable, %for.cond6: Invariant, %inner.loop: Invariant }
5959
; CHECK-NEXT: Determining loop execution counts for: @f

llvm/test/Analysis/ScalarEvolution/solve-quadratic-i1.ll

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -59,9 +59,9 @@ define void @f1() #0 {
5959
; CHECK-NEXT: %v6 = add nuw nsw i32 %v1, 1
6060
; CHECK-NEXT: --> {4,+,1}<nuw><nsw><%b1> U: [4,7) S: [4,7) Exits: 6 LoopDispositions: { %b1: Computable }
6161
; CHECK-NEXT: %v7 = phi i32 [ %v1, %b1 ]
62-
; CHECK-NEXT: --> {3,+,1}<nuw><nsw><%b1> U: [3,6) S: [3,6) --> 5 U: [5,6) S: [5,6)
62+
; CHECK-NEXT: --> %v7 U: [3,6) S: [3,6) --> 5 U: [5,6) S: [5,6)
6363
; CHECK-NEXT: %v8 = phi i16 [ %v3, %b1 ]
64-
; CHECK-NEXT: --> {3,+,4,+,1}<%b1> U: full-set S: full-set --> 12 U: [12,13) S: [12,13)
64+
; CHECK-NEXT: --> %v8 U: full-set S: full-set --> 12 U: [12,13) S: [12,13)
6565
; CHECK-NEXT: Determining loop execution counts for: @f1
6666
; CHECK-NEXT: Loop %b3: <multiple exits> Unpredictable backedge-taken count.
6767
; CHECK-NEXT: Loop %b3: Unpredictable max backedge-taken count.

llvm/test/Analysis/ScalarEvolution/solve-quadratic-overflow.ll

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -12,11 +12,11 @@
1212
; CHECK-NEXT: %v3 = mul i16 %v2, %v2
1313
; CHECK-NEXT: --> {1,+,3,+,2}<%b1> U: full-set S: full-set Exits: 0 LoopDispositions: { %b1: Computable }
1414
; CHECK-NEXT: %v5 = phi i16 [ %v2, %b1 ]
15-
; CHECK-NEXT: --> {-1,+,-1}<%b1> U: [-256,0) S: [-256,0) --> -256 U: [-256,-255) S: [-256,-255)
15+
; CHECK-NEXT: --> %v5 U: [-256,0) S: [-256,0)
1616
; CHECK-NEXT: %v6 = phi i16 [ %v3, %b1 ]
17-
; CHECK-NEXT: --> {1,+,3,+,2}<%b1> U: full-set S: full-set --> 0 U: [0,1) S: [0,1)
17+
; CHECK-NEXT: --> %v6 U: full-set S: full-set
1818
; CHECK-NEXT: %v7 = sext i16 %v5 to i32
19-
; CHECK-NEXT: --> {-1,+,-1}<nsw><%b1> U: [-256,0) S: [-256,0) --> -256 U: [-256,-255) S: [-256,-255)
19+
; CHECK-NEXT: --> (sext i16 %v5 to i32) U: [-256,0) S: [-256,0)
2020
; CHECK-NEXT: Determining loop execution counts for: @f0
2121
; CHECK-NEXT: Loop %b1: backedge-taken count is 255
2222
; CHECK-NEXT: Loop %b1: max backedge-taken count is 255

llvm/test/Transforms/LoopStrengthReduce/funclet.ll

Lines changed: 24 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -15,21 +15,23 @@ define void @f() personality i32 (...)* @_except_handler3 {
1515
; CHECK-NEXT: entry:
1616
; CHECK-NEXT: br label [[THROW:%.*]]
1717
; CHECK: throw:
18+
; CHECK-NEXT: [[TMP96:%.*]] = getelementptr inbounds i8, i8* undef, i32 1
1819
; CHECK-NEXT: invoke void @reserve()
1920
; CHECK-NEXT: to label [[THROW]] unwind label [[PAD:%.*]]
2021
; CHECK: pad:
22+
; CHECK-NEXT: [[PHI2:%.*]] = phi i8* [ [[TMP96]], [[THROW]] ]
2123
; CHECK-NEXT: [[CS:%.*]] = catchswitch within none [label %unreachable] unwind label [[BLAH2:%.*]]
2224
; CHECK: unreachable:
2325
; CHECK-NEXT: [[TMP0:%.*]] = catchpad within [[CS]] []
2426
; CHECK-NEXT: unreachable
2527
; CHECK: blah2:
2628
; CHECK-NEXT: [[CLEANUPPADI4_I_I_I:%.*]] = cleanuppad within none []
29+
; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, i8* [[PHI2]], i32 -1
2730
; CHECK-NEXT: br label [[LOOP_BODY:%.*]]
2831
; CHECK: loop_body:
29-
; CHECK-NEXT: [[LSR_IV:%.*]] = phi i32 [ [[LSR_IV_NEXT:%.*]], [[ITER:%.*]] ], [ 0, [[BLAH2]] ]
30-
; CHECK-NEXT: [[LSR_IV_NEXT]] = add nuw nsw i32 [[LSR_IV]], -1
31-
; CHECK-NEXT: [[LSR_IV_NEXT1:%.*]] = inttoptr i32 [[LSR_IV_NEXT]] to i8*
32-
; CHECK-NEXT: [[TMP100:%.*]] = icmp eq i8* [[LSR_IV_NEXT1]], null
32+
; CHECK-NEXT: [[LSR_IV:%.*]] = phi i8* [ [[SCEVGEP1:%.*]], [[ITER:%.*]] ], [ [[SCEVGEP]], [[BLAH2]] ]
33+
; CHECK-NEXT: [[SCEVGEP1]] = getelementptr i8, i8* [[LSR_IV]], i32 1
34+
; CHECK-NEXT: [[TMP100:%.*]] = icmp eq i8* [[SCEVGEP1]], undef
3335
; CHECK-NEXT: br i1 [[TMP100]], label [[UNWIND_OUT:%.*]], label [[ITER]]
3436
; CHECK: iter:
3537
; CHECK-NEXT: br i1 true, label [[UNWIND_OUT]], label [[LOOP_BODY]]
@@ -74,25 +76,27 @@ define void @g() personality i32 (...)* @_except_handler3 {
7476
; CHECK-NEXT: entry:
7577
; CHECK-NEXT: br label [[THROW:%.*]]
7678
; CHECK: throw:
79+
; CHECK-NEXT: [[TMP96:%.*]] = getelementptr inbounds i8, i8* undef, i32 1
7780
; CHECK-NEXT: invoke void @reserve()
7881
; CHECK-NEXT: to label [[THROW]] unwind label [[PAD:%.*]]
7982
; CHECK: pad:
83+
; CHECK-NEXT: [[PHI2:%.*]] = phi i8* [ [[TMP96]], [[THROW]] ]
8084
; CHECK-NEXT: [[CS:%.*]] = catchswitch within none [label [[UNREACHABLE:%.*]], label %blah] unwind to caller
8185
; CHECK: unreachable:
8286
; CHECK-NEXT: [[TMP0:%.*]] = catchpad within [[CS]] []
8387
; CHECK-NEXT: unreachable
8488
; CHECK: blah:
8589
; CHECK-NEXT: [[CATCHPAD:%.*]] = catchpad within [[CS]] []
90+
; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, i8* [[PHI2]], i32 -1
8691
; CHECK-NEXT: br label [[LOOP_BODY:%.*]]
8792
; CHECK: unwind_out:
8893
; CHECK-NEXT: catchret from [[CATCHPAD]] to label [[LEAVE:%.*]]
8994
; CHECK: leave:
9095
; CHECK-NEXT: ret void
9196
; CHECK: loop_body:
92-
; CHECK-NEXT: [[LSR_IV:%.*]] = phi i32 [ [[LSR_IV_NEXT:%.*]], [[ITER:%.*]] ], [ 0, [[BLAH:%.*]] ]
93-
; CHECK-NEXT: [[LSR_IV_NEXT]] = add nuw nsw i32 [[LSR_IV]], -1
94-
; CHECK-NEXT: [[LSR_IV_NEXT1:%.*]] = inttoptr i32 [[LSR_IV_NEXT]] to i8*
95-
; CHECK-NEXT: [[TMP100:%.*]] = icmp eq i8* [[LSR_IV_NEXT1]], null
97+
; CHECK-NEXT: [[LSR_IV:%.*]] = phi i8* [ [[SCEVGEP1:%.*]], [[ITER:%.*]] ], [ [[SCEVGEP]], [[BLAH:%.*]] ]
98+
; CHECK-NEXT: [[SCEVGEP1]] = getelementptr i8, i8* [[LSR_IV]], i32 1
99+
; CHECK-NEXT: [[TMP100:%.*]] = icmp eq i8* [[SCEVGEP1]], undef
96100
; CHECK-NEXT: br i1 [[TMP100]], label [[UNWIND_OUT:%.*]], label [[ITER]]
97101
; CHECK: iter:
98102
; CHECK-NEXT: br i1 true, label [[UNWIND_OUT]], label [[LOOP_BODY]]
@@ -138,6 +142,7 @@ define void @h() personality i32 (...)* @_except_handler3 {
138142
; CHECK-NEXT: entry:
139143
; CHECK-NEXT: br label [[THROW:%.*]]
140144
; CHECK: throw:
145+
; CHECK-NEXT: [[TMP96:%.*]] = getelementptr inbounds i8, i8* undef, i32 1
141146
; CHECK-NEXT: invoke void @reserve()
142147
; CHECK-NEXT: to label [[THROW]] unwind label [[PAD:%.*]]
143148
; CHECK: pad:
@@ -146,17 +151,18 @@ define void @h() personality i32 (...)* @_except_handler3 {
146151
; CHECK-NEXT: [[TMP0:%.*]] = catchpad within [[CS]] []
147152
; CHECK-NEXT: unreachable
148153
; CHECK: blug:
154+
; CHECK-NEXT: [[PHI2:%.*]] = phi i8* [ [[TMP96]], [[PAD]] ]
149155
; CHECK-NEXT: [[CATCHPAD:%.*]] = catchpad within [[CS]] []
156+
; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, i8* [[PHI2]], i32 -1
150157
; CHECK-NEXT: br label [[LOOP_BODY:%.*]]
151158
; CHECK: unwind_out:
152159
; CHECK-NEXT: catchret from [[CATCHPAD]] to label [[LEAVE:%.*]]
153160
; CHECK: leave:
154161
; CHECK-NEXT: ret void
155162
; CHECK: loop_body:
156-
; CHECK-NEXT: [[LSR_IV:%.*]] = phi i32 [ [[LSR_IV_NEXT:%.*]], [[ITER:%.*]] ], [ 0, [[BLUG:%.*]] ]
157-
; CHECK-NEXT: [[LSR_IV_NEXT]] = add nuw nsw i32 [[LSR_IV]], -1
158-
; CHECK-NEXT: [[LSR_IV_NEXT1:%.*]] = inttoptr i32 [[LSR_IV_NEXT]] to i8*
159-
; CHECK-NEXT: [[TMP100:%.*]] = icmp eq i8* [[LSR_IV_NEXT1]], null
163+
; CHECK-NEXT: [[LSR_IV:%.*]] = phi i8* [ [[SCEVGEP1:%.*]], [[ITER:%.*]] ], [ [[SCEVGEP]], [[BLUG:%.*]] ]
164+
; CHECK-NEXT: [[SCEVGEP1]] = getelementptr i8, i8* [[LSR_IV]], i32 1
165+
; CHECK-NEXT: [[TMP100:%.*]] = icmp eq i8* [[SCEVGEP1]], undef
160166
; CHECK-NEXT: br i1 [[TMP100]], label [[UNWIND_OUT:%.*]], label [[ITER]]
161167
; CHECK: iter:
162168
; CHECK-NEXT: br i1 true, label [[UNWIND_OUT]], label [[LOOP_BODY]]
@@ -202,9 +208,11 @@ define void @i() personality i32 (...)* @_except_handler3 {
202208
; CHECK-NEXT: entry:
203209
; CHECK-NEXT: br label [[THROW:%.*]]
204210
; CHECK: throw:
211+
; CHECK-NEXT: [[TMP96:%.*]] = getelementptr inbounds i8, i8* undef, i32 1
205212
; CHECK-NEXT: invoke void @reserve()
206213
; CHECK-NEXT: to label [[THROW]] unwind label [[CATCHPAD:%.*]]
207214
; CHECK: catchpad:
215+
; CHECK-NEXT: [[PHI2:%.*]] = phi i8* [ [[TMP96]], [[THROW]] ]
208216
; CHECK-NEXT: [[CS:%.*]] = catchswitch within none [label %cp_body] unwind label [[CLEANUPPAD:%.*]]
209217
; CHECK: cp_body:
210218
; CHECK-NEXT: [[TMP0:%.*]] = catchpad within [[CS]] []
@@ -213,12 +221,12 @@ define void @i() personality i32 (...)* @_except_handler3 {
213221
; CHECK-NEXT: [[TMP1:%.*]] = cleanuppad within none []
214222
; CHECK-NEXT: br label [[LOOP_HEAD]]
215223
; CHECK: loop_head:
224+
; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, i8* [[PHI2]], i32 -1
216225
; CHECK-NEXT: br label [[LOOP_BODY:%.*]]
217226
; CHECK: loop_body:
218-
; CHECK-NEXT: [[LSR_IV:%.*]] = phi i32 [ [[LSR_IV_NEXT:%.*]], [[ITER:%.*]] ], [ 0, [[LOOP_HEAD]] ]
219-
; CHECK-NEXT: [[LSR_IV_NEXT]] = add nuw nsw i32 [[LSR_IV]], -1
220-
; CHECK-NEXT: [[LSR_IV_NEXT1:%.*]] = inttoptr i32 [[LSR_IV_NEXT]] to i8*
221-
; CHECK-NEXT: [[TMP100:%.*]] = icmp eq i8* [[LSR_IV_NEXT1]], null
227+
; CHECK-NEXT: [[LSR_IV:%.*]] = phi i8* [ [[SCEVGEP1:%.*]], [[ITER:%.*]] ], [ [[SCEVGEP]], [[LOOP_HEAD]] ]
228+
; CHECK-NEXT: [[SCEVGEP1]] = getelementptr i8, i8* [[LSR_IV]], i32 1
229+
; CHECK-NEXT: [[TMP100:%.*]] = icmp eq i8* [[SCEVGEP1]], undef
222230
; CHECK-NEXT: br i1 [[TMP100]], label [[UNWIND_OUT:%.*]], label [[ITER]]
223231
; CHECK: iter:
224232
; CHECK-NEXT: br i1 true, label [[UNWIND_OUT]], label [[LOOP_BODY]]

llvm/test/Transforms/LoopVectorize/pr45259.ll

Lines changed: 33 additions & 34 deletions
Original file line numberDiff line numberDiff line change
@@ -6,62 +6,61 @@
66
define i8 @widget(i8* %arr, i8 %t9) {
77
; CHECK-LABEL: @widget(
88
; CHECK-NEXT: bb:
9-
; CHECK-NEXT: [[ARR1:%.*]] = ptrtoint i8* [[ARR:%.*]] to i64
9+
; CHECK-NEXT: [[ARR2:%.*]] = ptrtoint i8* [[ARR:%.*]] to i64
1010
; CHECK-NEXT: br label [[BB6:%.*]]
1111
; CHECK: bb6:
1212
; CHECK-NEXT: [[T1_0:%.*]] = phi i8* [ [[ARR]], [[BB:%.*]] ], [ null, [[BB6]] ]
1313
; CHECK-NEXT: [[C:%.*]] = call i1 @cond()
1414
; CHECK-NEXT: br i1 [[C]], label [[FOR_PREHEADER:%.*]], label [[BB6]]
1515
; CHECK: for.preheader:
1616
; CHECK-NEXT: [[T1_0_LCSSA:%.*]] = phi i8* [ [[T1_0]], [[BB6]] ]
17-
; CHECK-NEXT: [[T1_0_LCSSA2:%.*]] = ptrtoint i8* [[T1_0_LCSSA]] to i64
18-
; CHECK-NEXT: [[TMP0:%.*]] = trunc i64 [[ARR1]] to i32
19-
; CHECK-NEXT: [[TMP1:%.*]] = sub i32 0, [[TMP0]]
20-
; CHECK-NEXT: [[TMP2:%.*]] = trunc i64 [[T1_0_LCSSA2]] to i32
21-
; CHECK-NEXT: [[TMP3:%.*]] = add i32 [[TMP1]], [[TMP2]]
22-
; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i32 [[TMP3]], 4
17+
; CHECK-NEXT: [[T1_0_LCSSA1:%.*]] = ptrtoint i8* [[T1_0_LCSSA]] to i64
18+
; CHECK-NEXT: [[TMP0:%.*]] = trunc i64 [[T1_0_LCSSA1]] to i32
19+
; CHECK-NEXT: [[TMP1:%.*]] = trunc i64 [[ARR2]] to i32
20+
; CHECK-NEXT: [[TMP2:%.*]] = sub i32 [[TMP0]], [[TMP1]]
21+
; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i32 [[TMP2]], 4
2322
; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label [[SCALAR_PH:%.*]], label [[VECTOR_SCEVCHECK:%.*]]
2423
; CHECK: vector.scevcheck:
25-
; CHECK-NEXT: [[TMP4:%.*]] = sub i64 -1, [[ARR1]]
26-
; CHECK-NEXT: [[TMP5:%.*]] = add i64 [[TMP4]], [[T1_0_LCSSA2]]
27-
; CHECK-NEXT: [[TMP6:%.*]] = trunc i64 [[TMP5]] to i8
28-
; CHECK-NEXT: [[MUL:%.*]] = call { i8, i1 } @llvm.umul.with.overflow.i8(i8 1, i8 [[TMP6]])
24+
; CHECK-NEXT: [[TMP3:%.*]] = add i64 [[T1_0_LCSSA1]], -1
25+
; CHECK-NEXT: [[TMP4:%.*]] = sub i64 [[TMP3]], [[ARR2]]
26+
; CHECK-NEXT: [[TMP5:%.*]] = trunc i64 [[TMP4]] to i8
27+
; CHECK-NEXT: [[MUL:%.*]] = call { i8, i1 } @llvm.umul.with.overflow.i8(i8 1, i8 [[TMP5]])
2928
; CHECK-NEXT: [[MUL_RESULT:%.*]] = extractvalue { i8, i1 } [[MUL]], 0
3029
; CHECK-NEXT: [[MUL_OVERFLOW:%.*]] = extractvalue { i8, i1 } [[MUL]], 1
31-
; CHECK-NEXT: [[TMP7:%.*]] = add i8 1, [[MUL_RESULT]]
32-
; CHECK-NEXT: [[TMP8:%.*]] = sub i8 1, [[MUL_RESULT]]
33-
; CHECK-NEXT: [[TMP9:%.*]] = icmp sgt i8 [[TMP8]], 1
34-
; CHECK-NEXT: [[TMP10:%.*]] = icmp slt i8 [[TMP7]], 1
35-
; CHECK-NEXT: [[TMP11:%.*]] = select i1 false, i1 [[TMP9]], i1 [[TMP10]]
36-
; CHECK-NEXT: [[TMP12:%.*]] = icmp ugt i64 [[TMP5]], 255
37-
; CHECK-NEXT: [[TMP13:%.*]] = or i1 [[TMP11]], [[TMP12]]
38-
; CHECK-NEXT: [[TMP14:%.*]] = or i1 [[TMP13]], [[MUL_OVERFLOW]]
39-
; CHECK-NEXT: [[TMP15:%.*]] = or i1 false, [[TMP14]]
40-
; CHECK-NEXT: br i1 [[TMP15]], label [[SCALAR_PH]], label [[VECTOR_PH:%.*]]
30+
; CHECK-NEXT: [[TMP6:%.*]] = add i8 1, [[MUL_RESULT]]
31+
; CHECK-NEXT: [[TMP7:%.*]] = sub i8 1, [[MUL_RESULT]]
32+
; CHECK-NEXT: [[TMP8:%.*]] = icmp sgt i8 [[TMP7]], 1
33+
; CHECK-NEXT: [[TMP9:%.*]] = icmp slt i8 [[TMP6]], 1
34+
; CHECK-NEXT: [[TMP10:%.*]] = select i1 false, i1 [[TMP8]], i1 [[TMP9]]
35+
; CHECK-NEXT: [[TMP11:%.*]] = icmp ugt i64 [[TMP4]], 255
36+
; CHECK-NEXT: [[TMP12:%.*]] = or i1 [[TMP10]], [[TMP11]]
37+
; CHECK-NEXT: [[TMP13:%.*]] = or i1 [[TMP12]], [[MUL_OVERFLOW]]
38+
; CHECK-NEXT: [[TMP14:%.*]] = or i1 false, [[TMP13]]
39+
; CHECK-NEXT: br i1 [[TMP14]], label [[SCALAR_PH]], label [[VECTOR_PH:%.*]]
4140
; CHECK: vector.ph:
42-
; CHECK-NEXT: [[N_MOD_VF:%.*]] = urem i32 [[TMP3]], 4
43-
; CHECK-NEXT: [[N_VEC:%.*]] = sub i32 [[TMP3]], [[N_MOD_VF]]
41+
; CHECK-NEXT: [[N_MOD_VF:%.*]] = urem i32 [[TMP2]], 4
42+
; CHECK-NEXT: [[N_VEC:%.*]] = sub i32 [[TMP2]], [[N_MOD_VF]]
4443
; CHECK-NEXT: [[IND_END:%.*]] = trunc i32 [[N_VEC]] to i8
4544
; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <4 x i8> poison, i8 [[T9:%.*]], i32 0
4645
; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <4 x i8> [[BROADCAST_SPLATINSERT]], <4 x i8> poison, <4 x i32> zeroinitializer
4746
; CHECK-NEXT: br label [[VECTOR_BODY:%.*]]
4847
; CHECK: vector.body:
4948
; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ]
5049
; CHECK-NEXT: [[VEC_IND:%.*]] = phi <4 x i8> [ <i8 0, i8 1, i8 2, i8 3>, [[VECTOR_PH]] ], [ [[VEC_IND_NEXT:%.*]], [[VECTOR_BODY]] ]
51-
; CHECK-NEXT: [[TMP16:%.*]] = add <4 x i8> [[VEC_IND]], <i8 1, i8 1, i8 1, i8 1>
52-
; CHECK-NEXT: [[TMP17:%.*]] = extractelement <4 x i8> [[TMP16]], i32 0
53-
; CHECK-NEXT: [[TMP18:%.*]] = getelementptr inbounds i8, i8* [[ARR]], i8 [[TMP17]]
54-
; CHECK-NEXT: [[TMP19:%.*]] = icmp slt <4 x i8> [[TMP16]], [[BROADCAST_SPLAT]]
55-
; CHECK-NEXT: [[TMP20:%.*]] = zext <4 x i1> [[TMP19]] to <4 x i8>
56-
; CHECK-NEXT: [[TMP21:%.*]] = getelementptr inbounds i8, i8* [[TMP18]], i32 0
57-
; CHECK-NEXT: [[TMP22:%.*]] = bitcast i8* [[TMP21]] to <4 x i8>*
58-
; CHECK-NEXT: store <4 x i8> [[TMP20]], <4 x i8>* [[TMP22]], align 1
50+
; CHECK-NEXT: [[TMP15:%.*]] = add <4 x i8> [[VEC_IND]], <i8 1, i8 1, i8 1, i8 1>
51+
; CHECK-NEXT: [[TMP16:%.*]] = extractelement <4 x i8> [[TMP15]], i32 0
52+
; CHECK-NEXT: [[TMP17:%.*]] = getelementptr inbounds i8, i8* [[ARR]], i8 [[TMP16]]
53+
; CHECK-NEXT: [[TMP18:%.*]] = icmp slt <4 x i8> [[TMP15]], [[BROADCAST_SPLAT]]
54+
; CHECK-NEXT: [[TMP19:%.*]] = zext <4 x i1> [[TMP18]] to <4 x i8>
55+
; CHECK-NEXT: [[TMP20:%.*]] = getelementptr inbounds i8, i8* [[TMP17]], i32 0
56+
; CHECK-NEXT: [[TMP21:%.*]] = bitcast i8* [[TMP20]] to <4 x i8>*
57+
; CHECK-NEXT: store <4 x i8> [[TMP19]], <4 x i8>* [[TMP21]], align 1
5958
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 4
6059
; CHECK-NEXT: [[VEC_IND_NEXT]] = add <4 x i8> [[VEC_IND]], <i8 4, i8 4, i8 4, i8 4>
61-
; CHECK-NEXT: [[TMP23:%.*]] = icmp eq i32 [[INDEX_NEXT]], [[N_VEC]]
62-
; CHECK-NEXT: br i1 [[TMP23]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]]
60+
; CHECK-NEXT: [[TMP22:%.*]] = icmp eq i32 [[INDEX_NEXT]], [[N_VEC]]
61+
; CHECK-NEXT: br i1 [[TMP22]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]]
6362
; CHECK: middle.block:
64-
; CHECK-NEXT: [[CMP_N:%.*]] = icmp eq i32 [[TMP3]], [[N_VEC]]
63+
; CHECK-NEXT: [[CMP_N:%.*]] = icmp eq i32 [[TMP2]], [[N_VEC]]
6564
; CHECK-NEXT: br i1 [[CMP_N]], label [[FOR_EXIT:%.*]], label [[SCALAR_PH]]
6665
; CHECK: scalar.ph:
6766
; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i8 [ [[IND_END]], [[MIDDLE_BLOCK]] ], [ 0, [[FOR_PREHEADER]] ], [ 0, [[VECTOR_SCEVCHECK]] ]

0 commit comments

Comments
 (0)