Skip to content

Commit 920c589

Browse files
committed
[SLP][NFC]Add a test with the mask translate after buildvector shuffle cost estimation
1 parent 513fa28 commit 920c589

File tree

1 file changed

+98
-0
lines changed

1 file changed

+98
-0
lines changed
Lines changed: 98 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,98 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 5
2+
; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s
3+
4+
define i16 @test(i16 %v1, i16 %v2) {
5+
; CHECK-LABEL: define i16 @test(
6+
; CHECK-SAME: i16 [[V1:%.*]], i16 [[V2:%.*]]) {
7+
; CHECK-NEXT: [[ENTRY:.*:]]
8+
; CHECK-NEXT: [[TMP0:%.*]] = insertelement <4 x i16> <i16 0, i16 0, i16 0, i16 poison>, i16 [[V2]], i32 3
9+
; CHECK-NEXT: [[TMP1:%.*]] = insertelement <4 x i16> <i16 0, i16 0, i16 0, i16 poison>, i16 [[V1]], i32 3
10+
; CHECK-NEXT: [[TMP2:%.*]] = or <4 x i16> [[TMP0]], [[TMP1]]
11+
; CHECK-NEXT: [[TMP3:%.*]] = and <4 x i16> [[TMP0]], [[TMP1]]
12+
; CHECK-NEXT: [[TMP4:%.*]] = shufflevector <4 x i16> [[TMP2]], <4 x i16> [[TMP3]], <4 x i32> <i32 0, i32 1, i32 2, i32 7>
13+
; CHECK-NEXT: [[TMP5:%.*]] = shufflevector <4 x i16> [[TMP1]], <4 x i16> poison, <2 x i32> <i32 0, i32 poison>
14+
; CHECK-NEXT: [[TMP6:%.*]] = insertelement <2 x i16> [[TMP5]], i16 [[V2]], i32 1
15+
; CHECK-NEXT: [[TMP7:%.*]] = shufflevector <2 x i16> [[TMP6]], <2 x i16> poison, <4 x i32> <i32 0, i32 0, i32 0, i32 1>
16+
; CHECK-NEXT: [[TMP8:%.*]] = or <4 x i16> [[TMP7]], zeroinitializer
17+
; CHECK-NEXT: [[TMP9:%.*]] = and <4 x i16> [[TMP4]], zeroinitializer
18+
; CHECK-NEXT: [[TMP10:%.*]] = and <4 x i16> [[TMP9]], zeroinitializer
19+
; CHECK-NEXT: [[TMP11:%.*]] = icmp ne <4 x i16> [[TMP10]], zeroinitializer
20+
; CHECK-NEXT: [[TMP12:%.*]] = or <4 x i1> [[TMP11]], zeroinitializer
21+
; CHECK-NEXT: [[TMP13:%.*]] = or <4 x i16> [[TMP8]], zeroinitializer
22+
; CHECK-NEXT: [[TMP14:%.*]] = or <4 x i16> [[TMP13]], zeroinitializer
23+
; CHECK-NEXT: [[TMP15:%.*]] = or <4 x i16> [[TMP14]], zeroinitializer
24+
; CHECK-NEXT: [[TMP16:%.*]] = icmp ne <4 x i16> [[TMP15]], zeroinitializer
25+
; CHECK-NEXT: [[TMP17:%.*]] = or <4 x i1> zeroinitializer, [[TMP16]]
26+
; CHECK-NEXT: [[TMP18:%.*]] = or <4 x i1> [[TMP12]], [[TMP17]]
27+
; CHECK-NEXT: [[TMP19:%.*]] = extractelement <4 x i1> [[TMP18]], i32 2
28+
; CHECK-NEXT: [[TMP20:%.*]] = extractelement <4 x i1> [[TMP18]], i32 3
29+
; CHECK-NEXT: [[TMP21:%.*]] = or i1 [[TMP20]], [[TMP19]]
30+
; CHECK-NEXT: [[TMP22:%.*]] = extractelement <4 x i1> [[TMP18]], i32 1
31+
; CHECK-NEXT: [[TMP23:%.*]] = or i1 false, [[TMP22]]
32+
; CHECK-NEXT: [[TMP24:%.*]] = freeze <4 x i1> [[TMP18]]
33+
; CHECK-NEXT: [[TMP25:%.*]] = call i1 @llvm.vector.reduce.or.v4i1(<4 x i1> [[TMP24]])
34+
; CHECK-NEXT: [[SPEC_SELECT31:%.*]] = select i1 [[TMP25]], i32 0, i32 0
35+
; CHECK-NEXT: [[TMP26:%.*]] = extractelement <4 x i1> [[TMP18]], i32 0
36+
; CHECK-NEXT: [[TMP27:%.*]] = or i1 false, [[TMP26]]
37+
; CHECK-NEXT: store i32 [[SPEC_SELECT31]], ptr null, align 4
38+
; CHECK-NEXT: ret i16 0
39+
;
40+
entry:
41+
%0 = and i16 %v2, %v1
42+
%1 = and i16 %0, 0
43+
%2 = and i16 %1, 0
44+
%3 = icmp ne i16 %2, 0
45+
%.not5.not = or i1 %3, false
46+
%inc.1.1.i82.i.i = or i16 %v2, 0
47+
%inc.143.1.i98.i.i = or i16 0, 0
48+
%4 = or i16 %inc.1.1.i82.i.i, 0
49+
%5 = or i16 %4, 0
50+
%6 = or i16 %5, 0
51+
%7 = icmp ne i16 %6, 0
52+
%.not7.not = or i1 false, %7
53+
%8 = or i1 %.not5.not, %.not7.not
54+
%9 = and i16 0, %inc.143.1.i98.i.i
55+
%10 = and i16 %9, 0
56+
%11 = icmp ne i16 %10, 0
57+
%.not5.not.1 = or i1 %11, false
58+
%inc.143.i76.i.i.1 = or i16 %v1, 0
59+
%inc.143.1.i98.i.i.1 = or i16 0, 0
60+
%12 = or i16 0, %inc.143.i76.i.i.1
61+
%13 = or i16 %12, 0
62+
%14 = or i16 %13, 0
63+
%15 = icmp ne i16 %14, 0
64+
%.not7.not.1 = or i1 false, %15
65+
%16 = or i1 %.not5.not.1, %.not7.not.1
66+
%17 = or i1 %8, %16
67+
%18 = and i16 0, %inc.143.1.i98.i.i.1
68+
%19 = and i16 %18, 0
69+
%20 = icmp ne i16 %19, 0
70+
%.not5.not.2 = or i1 %20, false
71+
%inc.143.i76.i.i.2 = or i16 %v1, 0
72+
%inc.143.1.i98.i.i.2 = or i16 0, 0
73+
%21 = or i16 0, %inc.143.i76.i.i.2
74+
%22 = or i16 %21, 0
75+
%23 = or i16 %22, 0
76+
%24 = icmp ne i16 %23, 0
77+
%.not7.not.2 = or i1 false, %24
78+
%25 = or i1 %.not5.not.2, %.not7.not.2
79+
%26 = or i1 false, %25
80+
%27 = and i16 0, %inc.143.1.i98.i.i.2
81+
%28 = and i16 %27, 0
82+
%29 = icmp ne i16 %28, 0
83+
%.not5.not.3 = or i1 %29, false
84+
%inc.143.i76.i.i.3 = or i16 %v1, 0
85+
%30 = or i16 0, %inc.143.i76.i.i.3
86+
%31 = or i16 %30, 0
87+
%32 = or i16 %31, 0
88+
%33 = icmp ne i16 %32, 0
89+
%.not7.not.3 = or i1 false, %33
90+
%34 = or i1 %.not5.not.3, %.not7.not.3
91+
%35 = select i1 %34, i1 true, i1 %25
92+
%36 = select i1 %35, i1 true, i1 %16
93+
%37 = select i1 %36, i1 true, i1 %8
94+
%spec.select31 = select i1 %37, i32 0, i32 0
95+
%38 = or i1 false, %34
96+
store i32 %spec.select31, ptr null, align 4
97+
ret i16 0
98+
}

0 commit comments

Comments
 (0)