Skip to content

Commit e83c6dd

Browse files
committed
[SLP][NFC]Add a test with the non profitable masked gather loads.
1 parent e22ce61 commit e83c6dd

File tree

1 file changed

+35
-0
lines changed

1 file changed

+35
-0
lines changed
Lines changed: 35 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,35 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4
2+
; RUN: opt -S --passes=slp-vectorizer -mtriple=riscv64-unknown-linux -mattr=+v < %s | FileCheck %s
3+
4+
define void @test(ptr noalias %p, ptr %p1) {
5+
; CHECK-LABEL: define void @test(
6+
; CHECK-SAME: ptr noalias [[P:%.*]], ptr [[P1:%.*]]) #[[ATTR0:[0-9]+]] {
7+
; CHECK-NEXT: [[GEP799:%.*]] = getelementptr inbounds i8, ptr [[P]], i64 16
8+
; CHECK-NEXT: [[L3:%.*]] = load i16, ptr [[GEP799]], align 2
9+
; CHECK-NEXT: [[GEP3:%.*]] = getelementptr inbounds i8, ptr [[P]], i64 18
10+
; CHECK-NEXT: [[L4:%.*]] = load i16, ptr [[GEP3]], align 2
11+
; CHECK-NEXT: [[TMP1:%.*]] = load <2 x i16>, ptr [[P]], align 2
12+
; CHECK-NEXT: store <2 x i16> [[TMP1]], ptr [[P1]], align 2
13+
; CHECK-NEXT: [[GEPS2:%.*]] = getelementptr inbounds i8, ptr [[P1]], i64 4
14+
; CHECK-NEXT: store i16 [[L3]], ptr [[GEPS2]], align 2
15+
; CHECK-NEXT: [[GEPS3:%.*]] = getelementptr inbounds i8, ptr [[P1]], i64 6
16+
; CHECK-NEXT: store i16 [[L4]], ptr [[GEPS3]], align 2
17+
; CHECK-NEXT: ret void
18+
;
19+
%l1 = load i16, ptr %p, align 2
20+
%gep1 = getelementptr inbounds i8, ptr %p, i64 2
21+
%l2 = load i16, ptr %gep1, align 2
22+
%gep2 = getelementptr inbounds i8, ptr %p, i64 16
23+
%l3 = load i16, ptr %gep2, align 2
24+
%gep3 = getelementptr inbounds i8, ptr %p, i64 18
25+
%l4 = load i16, ptr %gep3, align 2
26+
store i16 %l1, ptr %p1, align 2
27+
%geps1 = getelementptr inbounds i8, ptr %p1, i64 2
28+
store i16 %l2, ptr %geps1, align 2
29+
%geps2 = getelementptr inbounds i8, ptr %p1, i64 4
30+
store i16 %l3, ptr %geps2, align 2
31+
%geps3 = getelementptr inbounds i8, ptr %p1, i64 6
32+
store i16 %l4, ptr %geps3, align 2
33+
ret void
34+
}
35+

0 commit comments

Comments
 (0)