Skip to content

Commit ecc63e7

Browse files
committed
Precommit test
1 parent 316a6ff commit ecc63e7

File tree

1 file changed

+57
-0
lines changed

1 file changed

+57
-0
lines changed
Lines changed: 57 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,57 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --check-globals none --version 5
2+
; RUN: opt < %s -passes=loop-vectorize -force-vector-width=4 -S | FileCheck %s
3+
4+
; Check that we don't unnecessarily broadcast %pow
5+
define void @powi(ptr noalias %p, i32 %pow) {
6+
; CHECK-LABEL: define void @powi(
7+
; CHECK-SAME: ptr noalias [[P:%.*]], i32 [[POW:%.*]]) {
8+
; CHECK-NEXT: [[ENTRY:.*]]:
9+
; CHECK-NEXT: br i1 false, label %[[SCALAR_PH:.*]], label %[[VECTOR_PH:.*]]
10+
; CHECK: [[VECTOR_PH]]:
11+
; CHECK-NEXT: [[BROADCAST_SPLATINSERT:%.*]] = insertelement <4 x i32> poison, i32 [[POW]], i64 0
12+
; CHECK-NEXT: [[BROADCAST_SPLAT:%.*]] = shufflevector <4 x i32> [[BROADCAST_SPLATINSERT]], <4 x i32> poison, <4 x i32> zeroinitializer
13+
; CHECK-NEXT: br label %[[VECTOR_BODY:.*]]
14+
; CHECK: [[VECTOR_BODY]]:
15+
; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, %[[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], %[[VECTOR_BODY]] ]
16+
; CHECK-NEXT: [[TMP0:%.*]] = getelementptr float, ptr [[P]], i32 [[INDEX]]
17+
; CHECK-NEXT: [[TMP1:%.*]] = getelementptr float, ptr [[TMP0]], i32 0
18+
; CHECK-NEXT: [[WIDE_LOAD:%.*]] = load <4 x float>, ptr [[TMP1]], align 4
19+
; CHECK-NEXT: [[TMP2:%.*]] = extractelement <4 x i32> [[BROADCAST_SPLAT]], i32 0
20+
; CHECK-NEXT: [[TMP3:%.*]] = call <4 x float> @llvm.powi.v4f32.i32(<4 x float> [[WIDE_LOAD]], i32 [[TMP2]])
21+
; CHECK-NEXT: store <4 x float> [[TMP3]], ptr [[TMP1]], align 4
22+
; CHECK-NEXT: [[INDEX_NEXT]] = add nuw i32 [[INDEX]], 4
23+
; CHECK-NEXT: [[TMP4:%.*]] = icmp eq i32 [[INDEX_NEXT]], 1024
24+
; CHECK-NEXT: br i1 [[TMP4]], label %[[MIDDLE_BLOCK:.*]], label %[[VECTOR_BODY]], !llvm.loop [[LOOP0:![0-9]+]]
25+
; CHECK: [[MIDDLE_BLOCK]]:
26+
; CHECK-NEXT: br i1 true, label %[[EXIT:.*]], label %[[SCALAR_PH]]
27+
; CHECK: [[SCALAR_PH]]:
28+
; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i32 [ 1024, %[[MIDDLE_BLOCK]] ], [ 0, %[[ENTRY]] ]
29+
; CHECK-NEXT: br label %[[LOOP:.*]]
30+
; CHECK: [[LOOP]]:
31+
; CHECK-NEXT: [[IV:%.*]] = phi i32 [ [[BC_RESUME_VAL]], %[[SCALAR_PH]] ], [ [[IV_NEXT:%.*]], %[[LOOP]] ]
32+
; CHECK-NEXT: [[P_GEP:%.*]] = getelementptr float, ptr [[P]], i32 [[IV]]
33+
; CHECK-NEXT: [[X:%.*]] = load float, ptr [[P_GEP]], align 4
34+
; CHECK-NEXT: [[Y:%.*]] = call float @llvm.powi.f32.i32(float [[X]], i32 [[POW]])
35+
; CHECK-NEXT: store float [[Y]], ptr [[P_GEP]], align 4
36+
; CHECK-NEXT: [[IV_NEXT]] = add i32 [[IV]], 1
37+
; CHECK-NEXT: [[DONE:%.*]] = icmp eq i32 [[IV_NEXT]], 1024
38+
; CHECK-NEXT: br i1 [[DONE]], label %[[EXIT]], label %[[LOOP]], !llvm.loop [[LOOP3:![0-9]+]]
39+
; CHECK: [[EXIT]]:
40+
; CHECK-NEXT: ret void
41+
;
42+
entry:
43+
br label %loop
44+
45+
loop:
46+
%iv = phi i32 [0, %entry], [%iv.next, %loop]
47+
%p.gep = getelementptr float, ptr %p, i32 %iv
48+
%x = load float, ptr %p.gep
49+
%y = call float @llvm.powi(float %x, i32 %pow)
50+
store float %y, ptr %p.gep
51+
%iv.next = add i32 %iv, 1
52+
%done = icmp eq i32 %iv.next, 1024
53+
br i1 %done, label %exit, label %loop
54+
55+
exit:
56+
ret void
57+
}

0 commit comments

Comments
 (0)