1
1
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2
2
; RUN: opt -passes=loop-versioning -S %s | FileCheck %s
3
3
4
- define void @lver.check.unnecessary (ptr %arg , ptr %arg1 , i1 %arg2 ) {
5
- ; CHECK-LABEL: define void @lver.check.unnecessary(
6
- ; CHECK-SAME: ptr [[ARG:%.*]], ptr [[ARG1:%.*]], i1 [[ARG2:%.*]]) {
4
+ ; Callers should not call LoopVersioning on single-iteration loops, as it
5
+ ; is very likely not profitable.
6
+ ; LoopVersioning faithfully versions single-iteration loops when the stride
7
+ ; is unknown.
8
+
9
+ define double @single_iteration_unknown_stride (i32 %x , ptr %y , i1 %cond ) {
10
+ ; CHECK-LABEL: define double @single_iteration_unknown_stride(
11
+ ; CHECK-SAME: i32 [[X:%.*]], ptr [[Y:%.*]], i1 [[COND:%.*]]) {
7
12
; CHECK-NEXT: [[ENTRY:.*:]]
8
- ; CHECK-NEXT: [[LOAD:%.*]] = load i32, ptr [[ARG]], align 4
9
- ; CHECK-NEXT: br i1 [[ARG2]], label %[[NOLOOP_EXIT:.*]], label %[[LOOP_BODY_LVER_CHECK:.*]]
13
+ ; CHECK-NEXT: br i1 [[COND]], label %[[NOLOOP_EXIT:.*]], label %[[LOOP_BODY_LVER_CHECK:.*]]
10
14
; CHECK: [[LOOP_BODY_LVER_CHECK]]:
11
- ; CHECK-NEXT: [[SEXT7:%.*]] = sext i32 [[LOAD]] to i64
12
- ; CHECK-NEXT: [[GEP8:%.*]] = getelementptr i8, ptr [[ARG1]], i64 8
13
- ; CHECK-NEXT: [[IDENT_CHECK:%.*]] = icmp ne i32 [[LOAD]], 1
15
+ ; CHECK-NEXT: [[SEXT7:%.*]] = sext i32 [[X]] to i64
16
+ ; CHECK-NEXT: [[GEP8:%.*]] = getelementptr i8, ptr [[Y]], i64 8
17
+ ; CHECK-NEXT: [[IDENT_CHECK:%.*]] = icmp ne i32 [[X]], 1
14
18
; CHECK-NEXT: br i1 [[IDENT_CHECK]], label %[[LOOP_BODY_PH_LVER_ORIG:.*]], label %[[LOOP_BODY_PH:.*]]
15
19
; CHECK: [[LOOP_BODY_PH_LVER_ORIG]]:
16
20
; CHECK-NEXT: br label %[[LOOP_BODY_LVER_ORIG:.*]]
@@ -19,7 +23,7 @@ define void @lver.check.unnecessary(ptr %arg, ptr %arg1, i1 %arg2) {
19
23
; CHECK-NEXT: [[MUL_LVER_ORIG:%.*]] = mul i64 [[PHI_LVER_ORIG]], [[SEXT7]]
20
24
; CHECK-NEXT: [[GEP10_LVER_ORIG:%.*]] = getelementptr double, ptr [[GEP8]], i64 [[MUL_LVER_ORIG]]
21
25
; CHECK-NEXT: [[LOAD11_LVER_ORIG:%.*]] = load double, ptr [[GEP10_LVER_ORIG]], align 8
22
- ; CHECK-NEXT: store double [[LOAD11_LVER_ORIG]], ptr [[ARG1]], align 8
26
+ ; CHECK-NEXT: store double [[LOAD11_LVER_ORIG]], ptr [[Y]], align 8
23
27
; CHECK-NEXT: [[ADD_LVER_ORIG]] = add i64 [[PHI_LVER_ORIG]], 1
24
28
; CHECK-NEXT: [[ICMP_LVER_ORIG:%.*]] = icmp eq i64 [[PHI_LVER_ORIG]], 0
25
29
; CHECK-NEXT: br i1 [[ICMP_LVER_ORIG]], label %[[LOOP_EXIT_LOOPEXIT:.*]], label %[[LOOP_BODY_LVER_ORIG]]
@@ -30,49 +34,52 @@ define void @lver.check.unnecessary(ptr %arg, ptr %arg1, i1 %arg2) {
30
34
; CHECK-NEXT: [[MUL:%.*]] = mul i64 [[PHI]], [[SEXT7]]
31
35
; CHECK-NEXT: [[GEP10:%.*]] = getelementptr double, ptr [[GEP8]], i64 [[MUL]]
32
36
; CHECK-NEXT: [[LOAD11:%.*]] = load double, ptr [[GEP10]], align 8
33
- ; CHECK-NEXT: store double [[LOAD11]], ptr [[ARG1]], align 8
37
+ ; CHECK-NEXT: store double [[LOAD11]], ptr [[Y]], align 8
34
38
; CHECK-NEXT: [[ADD]] = add i64 [[PHI]], 1
35
39
; CHECK-NEXT: [[ICMP:%.*]] = icmp eq i64 [[PHI]], 0
36
40
; CHECK-NEXT: br i1 [[ICMP]], label %[[LOOP_EXIT_LOOPEXIT1:.*]], label %[[LOOP_BODY]]
37
41
; CHECK: [[NOLOOP_EXIT]]:
38
- ; CHECK-NEXT: [[SEXT:%.*]] = sext i32 [[LOAD]] to i64
39
- ; CHECK-NEXT: [[GEP:%.*]] = getelementptr double, ptr [[ARG1]], i64 [[SEXT]]
42
+ ; CHECK-NEXT: [[SEXT:%.*]] = sext i32 [[X]] to i64
43
+ ; CHECK-NEXT: [[GEP:%.*]] = getelementptr double, ptr [[Y]], i64 [[SEXT]]
40
44
; CHECK-NEXT: [[LOAD5:%.*]] = load double, ptr [[GEP]], align 8
41
- ; CHECK-NEXT: store double [[LOAD5]], ptr [[ARG]], align 8
42
- ; CHECK-NEXT: ret void
45
+ ; CHECK-NEXT: ret double [[LOAD5]]
43
46
; CHECK: [[LOOP_EXIT_LOOPEXIT]]:
44
47
; CHECK-NEXT: br label %[[LOOP_EXIT:.*]]
45
48
; CHECK: [[LOOP_EXIT_LOOPEXIT1]]:
46
49
; CHECK-NEXT: br label %[[LOOP_EXIT]]
47
50
; CHECK: [[LOOP_EXIT]]:
48
- ; CHECK-NEXT: ret void
51
+ ; CHECK-NEXT: [[SEXT2:%.*]] = sext i32 [[X]] to i64
52
+ ; CHECK-NEXT: [[GEP2:%.*]] = getelementptr double, ptr [[Y]], i64 [[SEXT2]]
53
+ ; CHECK-NEXT: [[LOAD6:%.*]] = load double, ptr [[GEP2]], align 8
54
+ ; CHECK-NEXT: ret double [[LOAD6]]
49
55
;
50
56
entry:
51
- %load = load i32 , ptr %arg , align 4
52
- br i1 %arg2 , label %noloop.exit , label %loop.ph
57
+ br i1 %cond , label %noloop.exit , label %loop.ph
53
58
54
59
loop.ph: ; preds = %entry
55
- %sext7 = sext i32 %load to i64
56
- %gep8 = getelementptr i8 , ptr %arg1 , i64 8
60
+ %sext7 = sext i32 %x to i64
61
+ %gep8 = getelementptr i8 , ptr %y , i64 8
57
62
br label %loop.body
58
63
59
64
loop.body: ; preds = %loop.body, %loop.ph
60
- %phi = phi i64 [ 0 , %loop.ph ], [ %add , %loop.body ]
61
- %mul = mul i64 %phi , %sext7
65
+ %iv = phi i64 [ 0 , %loop.ph ], [ %iv.next , %loop.body ]
66
+ %mul = mul i64 %iv , %sext7
62
67
%gep10 = getelementptr double , ptr %gep8 , i64 %mul
63
68
%load11 = load double , ptr %gep10 , align 8
64
- store double %load11 , ptr %arg1 , align 8
65
- %add = add i64 %phi , 1
66
- %icmp = icmp eq i64 %phi , 0
69
+ store double %load11 , ptr %y , align 8
70
+ %iv.next = add i64 %iv , 1
71
+ %icmp = icmp eq i64 %iv , 0
67
72
br i1 %icmp , label %loop.exit , label %loop.body
68
73
69
74
noloop.exit: ; preds = %entry
70
- %sext = sext i32 %load to i64
71
- %gep = getelementptr double , ptr %arg1 , i64 %sext
75
+ %sext = sext i32 %x to i64
76
+ %gep = getelementptr double , ptr %y , i64 %sext
72
77
%load5 = load double , ptr %gep , align 8
73
- store double %load5 , ptr %arg , align 8
74
- ret void
78
+ ret double %load5
75
79
76
80
loop.exit: ; preds = %loop.body
77
- ret void
81
+ %sext2 = sext i32 %x to i64
82
+ %gep2 = getelementptr double , ptr %y , i64 %sext2
83
+ %load6 = load double , ptr %gep2 , align 8
84
+ ret double %load6
78
85
}
0 commit comments