Skip to content

Commit 1340ecf

Browse files
committed
[SCEV] Add more tests with zext(add C, %var)<nsw>.
Add extra test coverage for #142599.
1 parent 18e9455 commit 1340ecf

File tree

2 files changed

+143
-0
lines changed

2 files changed

+143
-0
lines changed
Lines changed: 101 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,101 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2+
; RUN: opt -p indvars -S %s | FileCheck %s
3+
4+
target datalayout = "e-m:o-p270:32:32-p271:32:32-p272:64:64-i64:64-i128:128-n32:64-S128-Fn32"
5+
6+
declare void @foo(i32)
7+
8+
define void @add_nsw_zext_fold_results_in_sext(i64 %len) {
9+
; CHECK-LABEL: define void @add_nsw_zext_fold_results_in_sext(
10+
; CHECK-SAME: i64 [[LEN:%.*]]) {
11+
; CHECK-NEXT: [[ENTRY:.*:]]
12+
; CHECK-NEXT: [[LEN_TRUNC:%.*]] = trunc i64 [[LEN]] to i32
13+
; CHECK-NEXT: [[LZ:%.*]] = tail call range(i32 0, 33) i32 @llvm.ctlz.i32(i32 [[LEN_TRUNC]], i1 false)
14+
; CHECK-NEXT: [[SUB_I:%.*]] = lshr i32 [[LZ]], 3
15+
; CHECK-NEXT: [[ADD_I:%.*]] = sub i32 5, [[SUB_I]]
16+
; CHECK-NEXT: [[PRECOND:%.*]] = icmp eq i32 [[SUB_I]], 5
17+
; CHECK-NEXT: br i1 [[PRECOND]], label %[[EXIT:.*]], label %[[LOOP_PREHEADER:.*]]
18+
; CHECK: [[LOOP_PREHEADER]]:
19+
; CHECK-NEXT: [[TMP1:%.*]] = zext nneg i32 [[ADD_I]] to i64
20+
; CHECK-NEXT: br label %[[LOOP:.*]]
21+
; CHECK: [[LOOP]]:
22+
; CHECK-NEXT: [[INDVARS_IV:%.*]] = phi i64 [ [[TMP1]], %[[LOOP_PREHEADER]] ], [ [[INDVARS_IV_NEXT:%.*]], %[[LOOP]] ]
23+
; CHECK-NEXT: [[IV:%.*]] = trunc nuw i64 [[INDVARS_IV]] to i32
24+
; CHECK-NEXT: [[IV_NEXT:%.*]] = add i32 [[IV]], 1
25+
; CHECK-NEXT: [[SH_PROM:%.*]] = zext nneg i32 [[IV_NEXT]] to i64
26+
; CHECK-NEXT: [[SHR:%.*]] = lshr i64 1, [[SH_PROM]]
27+
; CHECK-NEXT: [[TMP0:%.*]] = trunc nuw nsw i64 [[SHR]] to i32
28+
; CHECK-NEXT: call void @foo(i32 [[TMP0]])
29+
; CHECK-NEXT: [[EC:%.*]] = icmp eq i32 [[IV_NEXT]], 0
30+
; CHECK-NEXT: [[INDVARS_IV_NEXT]] = add nuw nsw i64 [[INDVARS_IV]], 1
31+
; CHECK-NEXT: br i1 [[EC]], label %[[EXIT_LOOPEXIT:.*]], label %[[LOOP]]
32+
; CHECK: [[EXIT_LOOPEXIT]]:
33+
; CHECK-NEXT: br label %[[EXIT]]
34+
; CHECK: [[EXIT]]:
35+
; CHECK-NEXT: ret void
36+
;
37+
entry:
38+
%len.trunc = trunc i64 %len to i32
39+
%lz = tail call range(i32 0, 33) i32 @llvm.ctlz.i32(i32 %len.trunc, i1 false)
40+
%sub.i = lshr i32 %lz, 3
41+
%add.i = sub nuw nsw i32 5, %sub.i
42+
%precond = icmp eq i32 %sub.i, 5
43+
br i1 %precond, label %exit, label %loop
44+
45+
loop:
46+
%iv = phi i32 [ %add.i, %entry ], [ %iv.next, %loop ]
47+
%iv.next = add i32 %iv, 1
48+
%sh_prom = zext nneg i32 %iv.next to i64
49+
%shr = lshr i64 1, %sh_prom
50+
%2 = trunc nuw nsw i64 %shr to i32
51+
call void @foo(i32 %2)
52+
%ec = icmp eq i32 %iv.next, 0
53+
br i1 %ec, label %exit, label %loop
54+
55+
exit:
56+
ret void
57+
}
58+
59+
define void @add_nsw_zext_fold_results_in_sext_known_positive(i32 %mask, ptr %src, i1 %c) {
60+
; CHECK-LABEL: define void @add_nsw_zext_fold_results_in_sext_known_positive(
61+
; CHECK-SAME: i32 [[MASK:%.*]], ptr [[SRC:%.*]], i1 [[C:%.*]]) {
62+
; CHECK-NEXT: [[ENTRY:.*:]]
63+
; CHECK-NEXT: [[SPEC_SELECT:%.*]] = select i1 [[C]], i32 0, i32 6
64+
; CHECK-NEXT: [[ADD:%.*]] = add i32 [[SPEC_SELECT]], [[MASK]]
65+
; CHECK-NEXT: [[PRECOND:%.*]] = icmp slt i32 [[ADD]], 0
66+
; CHECK-NEXT: br i1 [[PRECOND]], label %[[EXIT:.*]], label %[[PH:.*]]
67+
; CHECK: [[PH]]:
68+
; CHECK-NEXT: [[TMP0:%.*]] = sub i32 78, [[SPEC_SELECT]]
69+
; CHECK-NEXT: [[TMP1:%.*]] = zext nneg i32 [[TMP0]] to i64
70+
; CHECK-NEXT: [[TMP2:%.*]] = add nuw nsw i64 [[TMP1]], 1
71+
; CHECK-NEXT: br label %[[LOOP:.*]]
72+
; CHECK: [[LOOP]]:
73+
; CHECK-NEXT: [[GEP:%.*]] = getelementptr i32, ptr [[SRC]], i64 [[TMP2]]
74+
; CHECK-NEXT: [[L:%.*]] = load i32, ptr [[GEP]], align 1
75+
; CHECK-NEXT: call void @foo(i32 [[L]])
76+
; CHECK-NEXT: br label %[[LOOP]]
77+
; CHECK: [[EXIT]]:
78+
; CHECK-NEXT: ret void
79+
;
80+
entry:
81+
%spec.select = select i1 %c, i32 0, i32 6
82+
%add = add i32 %spec.select, %mask
83+
%precond = icmp slt i32 %add, 0
84+
br i1 %precond, label %exit, label %ph
85+
86+
ph:
87+
%start = sub i32 79, %spec.select
88+
br label %loop
89+
90+
loop: ; preds = %loop, %ph
91+
%iv = phi i32 [ %start, %ph ], [ %dec, %loop ]
92+
%iv.ext = zext i32 %iv to i64
93+
%gep = getelementptr i32, ptr %src, i64 %iv.ext
94+
%l = load i32, ptr %gep, align 1
95+
call void @foo(i32 %l)
96+
%dec = add i32 %iv, 0
97+
br label %loop
98+
99+
exit:
100+
ret void
101+
}
Lines changed: 42 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,42 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2+
; RUN: opt -p loop-idiom -S %s | FileCheck %s
3+
4+
define void @fold_add_zext_to_sext(ptr %dst, i1 %start) {
5+
; CHECK-LABEL: define void @fold_add_zext_to_sext(
6+
; CHECK-SAME: ptr [[DST:%.*]], i1 [[START:%.*]]) {
7+
; CHECK-NEXT: [[ENTRY:.*]]:
8+
; CHECK-NEXT: [[START_EXT:%.*]] = zext i1 [[START]] to i32
9+
; CHECK-NEXT: [[TMP0:%.*]] = zext i1 [[START]] to i64
10+
; CHECK-NEXT: [[TMP1:%.*]] = shl nuw nsw i64 [[TMP0]], 2
11+
; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i8, ptr [[DST]], i64 [[TMP1]]
12+
; CHECK-NEXT: [[TMP2:%.*]] = sub i32 25, [[START_EXT]]
13+
; CHECK-NEXT: [[TMP3:%.*]] = zext nneg i32 [[TMP2]] to i64
14+
; CHECK-NEXT: [[TMP4:%.*]] = shl nuw nsw i64 [[TMP3]], 2
15+
; CHECK-NEXT: call void @llvm.memset.p0.i64(ptr align 4 [[SCEVGEP]], i8 0, i64 [[TMP4]], i1 false)
16+
; CHECK-NEXT: br label %[[LOOP:.*]]
17+
; CHECK: [[LOOP]]:
18+
; CHECK-NEXT: [[IV:%.*]] = phi i32 [ [[START_EXT]], %[[ENTRY]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
19+
; CHECK-NEXT: [[IV_EXT:%.*]] = zext i32 [[IV]] to i64
20+
; CHECK-NEXT: [[GEP:%.*]] = getelementptr i32, ptr [[DST]], i64 [[IV_EXT]]
21+
; CHECK-NEXT: [[IV_NEXT]] = add i32 [[IV]], 1
22+
; CHECK-NEXT: [[EC:%.*]] = icmp ult i32 [[IV]], 24
23+
; CHECK-NEXT: br i1 [[EC]], label %[[LOOP]], label %[[EXIT:.*]]
24+
; CHECK: [[EXIT]]:
25+
; CHECK-NEXT: ret void
26+
;
27+
entry:
28+
%start.ext = zext i1 %start to i32
29+
br label %loop
30+
31+
loop:
32+
%iv = phi i32 [ %start.ext, %entry ], [ %iv.next, %loop ]
33+
%iv.ext = zext i32 %iv to i64
34+
%gep = getelementptr i32, ptr %dst, i64 %iv.ext
35+
store i32 0, ptr %gep, align 4
36+
%iv.next = add i32 %iv, 1
37+
%ec = icmp ult i32 %iv, 24
38+
br i1 %ec, label %loop, label %exit
39+
40+
exit:
41+
ret void
42+
}

0 commit comments

Comments
 (0)