@@ -8,60 +8,14 @@ define void @foo(ptr noalias %a, i64 %N) {
8
8
; CHECK-LABEL: define void @foo(
9
9
; CHECK-SAME: ptr noalias [[A:%.*]], i64 [[N:%.*]]) #[[ATTR0:[0-9]+]] {
10
10
; CHECK-NEXT: entry:
11
- ; CHECK-NEXT: [[TMP0:%.*]] = sub i64 -1, [[N]]
12
- ; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.vscale.i64()
13
- ; CHECK-NEXT: [[TMP2:%.*]] = mul i64 [[TMP1]], 2
14
- ; CHECK-NEXT: [[TMP3:%.*]] = icmp ult i64 [[TMP0]], [[TMP2]]
15
- ; CHECK-NEXT: br i1 [[TMP3]], label [[SCALAR_PH:%.*]], label [[ENTRY:%.*]]
16
- ; CHECK: vector.ph:
17
- ; CHECK-NEXT: [[TMP4:%.*]] = call i64 @llvm.vscale.i64()
18
- ; CHECK-NEXT: [[TMP5:%.*]] = mul i64 [[TMP4]], 2
19
- ; CHECK-NEXT: [[TMP6:%.*]] = call i64 @llvm.vscale.i64()
20
- ; CHECK-NEXT: [[TMP7:%.*]] = mul i64 [[TMP6]], 2
21
- ; CHECK-NEXT: [[TMP8:%.*]] = sub i64 [[TMP7]], 1
22
- ; CHECK-NEXT: [[N_RND_UP:%.*]] = add i64 [[N]], [[TMP8]]
23
- ; CHECK-NEXT: [[N_MOD_VF:%.*]] = urem i64 [[N_RND_UP]], [[TMP5]]
24
- ; CHECK-NEXT: [[N_VEC:%.*]] = sub i64 [[N_RND_UP]], [[N_MOD_VF]]
25
- ; CHECK-NEXT: [[TMP9:%.*]] = call i64 @llvm.vscale.i64()
26
- ; CHECK-NEXT: [[TMP10:%.*]] = mul i64 [[TMP9]], 2
27
- ; CHECK-NEXT: [[TMP11:%.*]] = call <vscale x 2 x i64> @llvm.experimental.stepvector.nxv2i64()
28
- ; CHECK-NEXT: [[TMP12:%.*]] = add <vscale x 2 x i64> [[TMP11]], zeroinitializer
29
- ; CHECK-NEXT: [[TMP13:%.*]] = mul <vscale x 2 x i64> [[TMP12]], shufflevector (<vscale x 2 x i64> insertelement (<vscale x 2 x i64> poison, i64 1, i64 0), <vscale x 2 x i64> poison, <vscale x 2 x i32> zeroinitializer)
30
- ; CHECK-NEXT: [[INDUCTION:%.*]] = add <vscale x 2 x i64> zeroinitializer, [[TMP13]]
31
- ; CHECK-NEXT: [[TMP14:%.*]] = call i64 @llvm.vscale.i64()
32
- ; CHECK-NEXT: [[TMP15:%.*]] = mul i64 [[TMP14]], 2
33
- ; CHECK-NEXT: [[TMP16:%.*]] = mul i64 1, [[TMP15]]
34
- ; CHECK-NEXT: [[DOTSPLATINSERT:%.*]] = insertelement <vscale x 2 x i64> poison, i64 [[TMP16]], i64 0
35
- ; CHECK-NEXT: [[DOTSPLAT:%.*]] = shufflevector <vscale x 2 x i64> [[DOTSPLATINSERT]], <vscale x 2 x i64> poison, <vscale x 2 x i32> zeroinitializer
36
- ; CHECK-NEXT: br label [[FOR_BODY:%.*]]
37
- ; CHECK: vector.body:
38
- ; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, [[ENTRY]] ], [ [[IV_NEXT:%.*]], [[FOR_BODY]] ]
39
- ; CHECK-NEXT: [[EVL_BASED_IV:%.*]] = phi i64 [ 0, [[ENTRY]] ], [ [[INDEX_EVL_NEXT:%.*]], [[FOR_BODY]] ]
40
- ; CHECK-NEXT: [[VEC_IND:%.*]] = phi <vscale x 2 x i64> [ [[INDUCTION]], [[ENTRY]] ], [ [[VEC_IND_NEXT:%.*]], [[FOR_BODY]] ]
41
- ; CHECK-NEXT: [[TMP17:%.*]] = sub i64 [[N]], [[EVL_BASED_IV]]
42
- ; CHECK-NEXT: [[TMP18:%.*]] = call i32 @llvm.experimental.get.vector.length.i64(i64 [[TMP17]], i32 2, i1 true)
43
- ; CHECK-NEXT: [[TMP19:%.*]] = add i64 [[EVL_BASED_IV]], 0
44
- ; CHECK-NEXT: [[TMP20:%.*]] = getelementptr inbounds i64, ptr [[A]], i64 [[TMP19]]
45
- ; CHECK-NEXT: [[TMP21:%.*]] = getelementptr inbounds i64, ptr [[TMP20]], i32 0
46
- ; CHECK-NEXT: call void @llvm.vp.store.nxv2i64.p0(<vscale x 2 x i64> [[VEC_IND]], ptr align 8 [[TMP21]], <vscale x 2 x i1> shufflevector (<vscale x 2 x i1> insertelement (<vscale x 2 x i1> poison, i1 true, i64 0), <vscale x 2 x i1> poison, <vscale x 2 x i32> zeroinitializer), i32 [[TMP18]])
47
- ; CHECK-NEXT: [[TMP22:%.*]] = zext i32 [[TMP18]] to i64
48
- ; CHECK-NEXT: [[INDEX_EVL_NEXT]] = add i64 [[TMP22]], [[EVL_BASED_IV]]
49
- ; CHECK-NEXT: [[IV_NEXT]] = add i64 [[IV]], [[TMP10]]
50
- ; CHECK-NEXT: [[VEC_IND_NEXT]] = add <vscale x 2 x i64> [[VEC_IND]], [[DOTSPLAT]]
51
- ; CHECK-NEXT: [[TMP23:%.*]] = icmp eq i64 [[IV_NEXT]], [[N_VEC]]
52
- ; CHECK-NEXT: br i1 [[TMP23]], label [[MIDDLE_BLOCK:%.*]], label [[FOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]]
53
- ; CHECK: middle.block:
54
- ; CHECK-NEXT: br i1 true, label [[FOR_COND_CLEANUP:%.*]], label [[SCALAR_PH]]
55
- ; CHECK: scalar.ph:
56
- ; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ [[N_VEC]], [[MIDDLE_BLOCK]] ], [ 0, [[ENTRY1:%.*]] ]
57
11
; CHECK-NEXT: br label [[FOR_BODY1:%.*]]
58
12
; CHECK: for.body:
59
- ; CHECK-NEXT: [[IV1:%.*]] = phi i64 [ [[BC_RESUME_VAL]] , [[SCALAR_PH ]] ], [ [[IV_NEXT1:%.*]], [[FOR_BODY1]] ]
13
+ ; CHECK-NEXT: [[IV1:%.*]] = phi i64 [ 0 , [[ENTRY:%.* ]] ], [ [[IV_NEXT1:%.*]], [[FOR_BODY1]] ]
60
14
; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i64, ptr [[A]], i64 [[IV1]]
61
15
; CHECK-NEXT: store i64 [[IV1]], ptr [[ARRAYIDX]], align 8
62
16
; CHECK-NEXT: [[IV_NEXT1]] = add nuw nsw i64 [[IV1]], 1
63
17
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT1]], [[N]]
64
- ; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label [[FOR_COND_CLEANUP]], label [[FOR_BODY1]], !llvm.loop [[LOOP3:![0-9]+ ]]
18
+ ; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label [[FOR_COND_CLEANUP:%.* ]], label [[FOR_BODY1]]
65
19
; CHECK: for.cond.cleanup:
66
20
; CHECK-NEXT: ret void
67
21
;
@@ -85,67 +39,16 @@ define void @foo2(ptr noalias %a, ptr noalias %b, i64 %N) {
85
39
; CHECK-LABEL: define void @foo2(
86
40
; CHECK-SAME: ptr noalias [[A:%.*]], ptr noalias [[B:%.*]], i64 [[N:%.*]]) #[[ATTR0]] {
87
41
; CHECK-NEXT: entry:
88
- ; CHECK-NEXT: [[TMP0:%.*]] = sub i64 -1, [[N]]
89
- ; CHECK-NEXT: [[TMP1:%.*]] = call i64 @llvm.vscale.i64()
90
- ; CHECK-NEXT: [[TMP2:%.*]] = mul i64 [[TMP1]], 2
91
- ; CHECK-NEXT: [[TMP3:%.*]] = icmp ult i64 [[TMP0]], [[TMP2]]
92
- ; CHECK-NEXT: br i1 [[TMP3]], label [[SCALAR_PH:%.*]], label [[ENTRY:%.*]]
93
- ; CHECK: vector.ph:
94
- ; CHECK-NEXT: [[TMP4:%.*]] = call i64 @llvm.vscale.i64()
95
- ; CHECK-NEXT: [[TMP5:%.*]] = mul i64 [[TMP4]], 2
96
- ; CHECK-NEXT: [[TMP6:%.*]] = call i64 @llvm.vscale.i64()
97
- ; CHECK-NEXT: [[TMP7:%.*]] = mul i64 [[TMP6]], 2
98
- ; CHECK-NEXT: [[TMP8:%.*]] = sub i64 [[TMP7]], 1
99
- ; CHECK-NEXT: [[N_RND_UP:%.*]] = add i64 [[N]], [[TMP8]]
100
- ; CHECK-NEXT: [[N_MOD_VF:%.*]] = urem i64 [[N_RND_UP]], [[TMP5]]
101
- ; CHECK-NEXT: [[N_VEC:%.*]] = sub i64 [[N_RND_UP]], [[N_MOD_VF]]
102
- ; CHECK-NEXT: [[TMP9:%.*]] = mul i64 [[N_VEC]], 8
103
- ; CHECK-NEXT: [[IND_END:%.*]] = getelementptr i8, ptr [[B]], i64 [[TMP9]]
104
- ; CHECK-NEXT: [[TMP10:%.*]] = call i64 @llvm.vscale.i64()
105
- ; CHECK-NEXT: [[TMP11:%.*]] = mul i64 [[TMP10]], 2
106
42
; CHECK-NEXT: br label [[FOR_BODY:%.*]]
107
- ; CHECK: vector.body:
108
- ; CHECK-NEXT: [[POINTER_PHI:%.*]] = phi ptr [ [[B]], [[ENTRY]] ], [ [[PTR_IND:%.*]], [[FOR_BODY]] ]
109
- ; CHECK-NEXT: [[IV:%.*]] = phi i64 [ 0, [[ENTRY]] ], [ [[IV_NEXT:%.*]], [[FOR_BODY]] ]
110
- ; CHECK-NEXT: [[EVL_BASED_IV:%.*]] = phi i64 [ 0, [[ENTRY]] ], [ [[INDEX_EVL_NEXT:%.*]], [[FOR_BODY]] ]
111
- ; CHECK-NEXT: [[TMP12:%.*]] = call i64 @llvm.vscale.i64()
112
- ; CHECK-NEXT: [[TMP13:%.*]] = mul i64 [[TMP12]], 2
113
- ; CHECK-NEXT: [[TMP14:%.*]] = mul i64 [[TMP13]], 1
114
- ; CHECK-NEXT: [[TMP15:%.*]] = mul i64 8, [[TMP14]]
115
- ; CHECK-NEXT: [[TMP16:%.*]] = mul i64 [[TMP13]], 0
116
- ; CHECK-NEXT: [[DOTSPLATINSERT:%.*]] = insertelement <vscale x 2 x i64> poison, i64 [[TMP16]], i64 0
117
- ; CHECK-NEXT: [[DOTSPLAT:%.*]] = shufflevector <vscale x 2 x i64> [[DOTSPLATINSERT]], <vscale x 2 x i64> poison, <vscale x 2 x i32> zeroinitializer
118
- ; CHECK-NEXT: [[TMP17:%.*]] = call <vscale x 2 x i64> @llvm.experimental.stepvector.nxv2i64()
119
- ; CHECK-NEXT: [[TMP18:%.*]] = add <vscale x 2 x i64> [[DOTSPLAT]], [[TMP17]]
120
- ; CHECK-NEXT: [[VECTOR_GEP:%.*]] = mul <vscale x 2 x i64> [[TMP18]], shufflevector (<vscale x 2 x i64> insertelement (<vscale x 2 x i64> poison, i64 8, i64 0), <vscale x 2 x i64> poison, <vscale x 2 x i32> zeroinitializer)
121
- ; CHECK-NEXT: [[TMP19:%.*]] = getelementptr i8, ptr [[POINTER_PHI]], <vscale x 2 x i64> [[VECTOR_GEP]]
122
- ; CHECK-NEXT: [[TMP20:%.*]] = sub i64 [[N]], [[EVL_BASED_IV]]
123
- ; CHECK-NEXT: [[TMP21:%.*]] = call i32 @llvm.experimental.get.vector.length.i64(i64 [[TMP20]], i32 2, i1 true)
124
- ; CHECK-NEXT: [[TMP22:%.*]] = add i64 [[EVL_BASED_IV]], 0
125
- ; CHECK-NEXT: [[TMP23:%.*]] = getelementptr inbounds i64, ptr [[A]], i64 [[TMP22]]
126
- ; CHECK-NEXT: [[TMP24:%.*]] = getelementptr inbounds ptr, ptr [[TMP23]], i32 0
127
- ; CHECK-NEXT: call void @llvm.vp.store.nxv2p0.p0(<vscale x 2 x ptr> [[TMP19]], ptr align 8 [[TMP24]], <vscale x 2 x i1> shufflevector (<vscale x 2 x i1> insertelement (<vscale x 2 x i1> poison, i1 true, i64 0), <vscale x 2 x i1> poison, <vscale x 2 x i32> zeroinitializer), i32 [[TMP21]])
128
- ; CHECK-NEXT: [[TMP25:%.*]] = zext i32 [[TMP21]] to i64
129
- ; CHECK-NEXT: [[INDEX_EVL_NEXT]] = add i64 [[TMP25]], [[EVL_BASED_IV]]
130
- ; CHECK-NEXT: [[IV_NEXT]] = add i64 [[IV]], [[TMP11]]
131
- ; CHECK-NEXT: [[PTR_IND]] = getelementptr i8, ptr [[POINTER_PHI]], i64 [[TMP15]]
132
- ; CHECK-NEXT: [[TMP26:%.*]] = icmp eq i64 [[IV_NEXT]], [[N_VEC]]
133
- ; CHECK-NEXT: br i1 [[TMP26]], label [[MIDDLE_BLOCK:%.*]], label [[FOR_BODY]], !llvm.loop [[LOOP4:![0-9]+]]
134
- ; CHECK: middle.block:
135
- ; CHECK-NEXT: br i1 true, label [[FOR_COND_CLEANUP:%.*]], label [[SCALAR_PH]]
136
- ; CHECK: scalar.ph:
137
- ; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ [[N_VEC]], [[MIDDLE_BLOCK]] ], [ 0, [[ENTRY1:%.*]] ]
138
- ; CHECK-NEXT: [[BC_RESUME_VAL1:%.*]] = phi ptr [ [[IND_END]], [[MIDDLE_BLOCK]] ], [ [[B]], [[ENTRY1]] ]
139
- ; CHECK-NEXT: br label [[FOR_BODY1:%.*]]
140
43
; CHECK: for.body:
141
- ; CHECK-NEXT: [[IV1 :%.*]] = phi i64 [ [[BC_RESUME_VAL]] , [[SCALAR_PH ]] ], [ [[IV_NEXT1 :%.*]], [[FOR_BODY1 ]] ]
142
- ; CHECK-NEXT: [[ADDR:%.*]] = phi ptr [ [[INCDEC_PTR:%.*]], [[FOR_BODY1 ]] ], [ [[BC_RESUME_VAL1 ]], [[SCALAR_PH ]] ]
44
+ ; CHECK-NEXT: [[EVL_BASED_IV :%.*]] = phi i64 [ 0 , [[ENTRY:%.* ]] ], [ [[INDEX_EVL_NEXT :%.*]], [[FOR_BODY ]] ]
45
+ ; CHECK-NEXT: [[ADDR:%.*]] = phi ptr [ [[INCDEC_PTR:%.*]], [[FOR_BODY ]] ], [ [[B ]], [[ENTRY ]] ]
143
46
; CHECK-NEXT: [[INCDEC_PTR]] = getelementptr inbounds i8, ptr [[ADDR]], i64 8
144
- ; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i64, ptr [[A]], i64 [[IV1 ]]
47
+ ; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i64, ptr [[A]], i64 [[EVL_BASED_IV ]]
145
48
; CHECK-NEXT: store ptr [[ADDR]], ptr [[ARRAYIDX]], align 8
146
- ; CHECK-NEXT: [[IV_NEXT1 ]] = add nuw nsw i64 [[IV1 ]], 1
147
- ; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT1 ]], [[N]]
148
- ; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label [[FOR_COND_CLEANUP]], label [[FOR_BODY1]], !llvm.loop [[LOOP5:![0-9]+ ]]
49
+ ; CHECK-NEXT: [[INDEX_EVL_NEXT ]] = add nuw nsw i64 [[EVL_BASED_IV ]], 1
50
+ ; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[INDEX_EVL_NEXT ]], [[N]]
51
+ ; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label [[FOR_COND_CLEANUP:%.* ]], label [[FOR_BODY ]]
149
52
; CHECK: for.cond.cleanup:
150
53
; CHECK-NEXT: ret void
151
54
;
@@ -217,7 +120,7 @@ define void @foo3(ptr noalias %a, i64 %N) {
217
120
; CHECK-NEXT: call void @llvm.masked.store.nxv2i64.p0(<vscale x 2 x i64> [[REVERSE6]], ptr [[TMP21]], i32 8, <vscale x 2 x i1> [[REVERSE]])
218
121
; CHECK-NEXT: [[INDEX_EVL_NEXT]] = add i64 [[EVL_BASED_IV]], [[TMP11]]
219
122
; CHECK-NEXT: [[TMP22:%.*]] = icmp eq i64 [[INDEX_EVL_NEXT]], [[N_VEC]]
220
- ; CHECK-NEXT: br i1 [[TMP22]], label [[MIDDLE_BLOCK:%.*]], label [[FOR_BODY]], !llvm.loop [[LOOP6 :![0-9]+]]
123
+ ; CHECK-NEXT: br i1 [[TMP22]], label [[MIDDLE_BLOCK:%.*]], label [[FOR_BODY]], !llvm.loop [[LOOP0 :![0-9]+]]
221
124
; CHECK: middle.block:
222
125
; CHECK-NEXT: br i1 true, label [[FOR_COND_CLEANUP:%.*]], label [[SCALAR_PH]]
223
126
; CHECK: scalar.ph:
@@ -231,7 +134,7 @@ define void @foo3(ptr noalias %a, i64 %N) {
231
134
; CHECK-NEXT: store i64 [[N]], ptr [[ADDR]], align 8
232
135
; CHECK-NEXT: [[IV_NEXT]] = add nuw nsw i64 [[IV]], 1
233
136
; CHECK-NEXT: [[EXITCOND_NOT:%.*]] = icmp eq i64 [[IV_NEXT]], [[N]]
234
- ; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label [[FOR_COND_CLEANUP]], label [[FOR_BODY1]], !llvm.loop [[LOOP7 :![0-9]+]]
137
+ ; CHECK-NEXT: br i1 [[EXITCOND_NOT]], label [[FOR_COND_CLEANUP]], label [[FOR_BODY1]], !llvm.loop [[LOOP3 :![0-9]+]]
235
138
; CHECK: for.cond.cleanup:
236
139
; CHECK-NEXT: ret void
237
140
;
@@ -255,8 +158,4 @@ for.cond.cleanup:
255
158
; CHECK: [[META1]] = !{!"llvm.loop.isvectorized", i32 1}
256
159
; CHECK: [[META2]] = !{!"llvm.loop.unroll.runtime.disable"}
257
160
; CHECK: [[LOOP3]] = distinct !{[[LOOP3]], [[META2]], [[META1]]}
258
- ; CHECK: [[LOOP4]] = distinct !{[[LOOP4]], [[META1]], [[META2]]}
259
- ; CHECK: [[LOOP5]] = distinct !{[[LOOP5]], [[META2]], [[META1]]}
260
- ; CHECK: [[LOOP6]] = distinct !{[[LOOP6]], [[META1]], [[META2]]}
261
- ; CHECK: [[LOOP7]] = distinct !{[[LOOP7]], [[META2]], [[META1]]}
262
161
;.
0 commit comments