Skip to content

Commit df7eb20

Browse files
committed
[SLP][NFC]Add a test with incorrect final analysis for unsigned nodes, being used in signed nodes.
1 parent ee0284e commit df7eb20

File tree

1 file changed

+77
-0
lines changed

1 file changed

+77
-0
lines changed
Lines changed: 77 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,77 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4
2+
; RUN: opt -S --passes=slp-vectorizer -mtriple=riscv64-unknown-linux -mattr=+v < %s | FileCheck %s
3+
4+
define void @test(ptr %p, i16 %load794) {
5+
; CHECK-LABEL: define void @test(
6+
; CHECK-SAME: ptr [[P:%.*]], i16 [[LOAD794:%.*]]) #[[ATTR0:[0-9]+]] {
7+
; CHECK-NEXT: [[ZEXT795:%.*]] = zext i16 [[LOAD794]] to i32
8+
; CHECK-NEXT: [[GEP799:%.*]] = getelementptr inbounds i8, ptr [[P]], i64 16
9+
; CHECK-NEXT: [[TMP1:%.*]] = load <2 x i16>, ptr [[P]], align 2
10+
; CHECK-NEXT: [[TMP2:%.*]] = load <2 x i16>, ptr [[GEP799]], align 2
11+
; CHECK-NEXT: [[TMP3:%.*]] = sub <2 x i16> [[TMP2]], [[TMP1]]
12+
; CHECK-NEXT: [[TMP4:%.*]] = add <2 x i16> [[TMP3]], <i16 3329, i16 3329>
13+
; CHECK-NEXT: [[TMP5:%.*]] = insertelement <2 x i32> poison, i32 [[ZEXT795]], i32 0
14+
; CHECK-NEXT: [[TMP6:%.*]] = shufflevector <2 x i32> [[TMP5]], <2 x i32> poison, <2 x i32> zeroinitializer
15+
; CHECK-NEXT: [[TMP7:%.*]] = trunc <2 x i32> [[TMP6]] to <2 x i16>
16+
; CHECK-NEXT: [[TMP8:%.*]] = mul <2 x i16> [[TMP4]], [[TMP7]]
17+
; CHECK-NEXT: [[TMP9:%.*]] = zext <2 x i16> [[TMP8]] to <2 x i64>
18+
; CHECK-NEXT: [[TMP10:%.*]] = mul nuw nsw <2 x i64> [[TMP9]], <i64 5039, i64 5039>
19+
; CHECK-NEXT: [[TMP11:%.*]] = lshr <2 x i64> [[TMP10]], <i64 24, i64 24>
20+
; CHECK-NEXT: [[TMP12:%.*]] = trunc <2 x i64> [[TMP11]] to <2 x i16>
21+
; CHECK-NEXT: [[TMP13:%.*]] = mul <2 x i16> [[TMP12]], <i16 -3329, i16 -3329>
22+
; CHECK-NEXT: [[TMP14:%.*]] = add <2 x i16> [[TMP13]], [[TMP8]]
23+
; CHECK-NEXT: [[TMP15:%.*]] = add <2 x i16> [[TMP14]], <i16 -3329, i16 -3329>
24+
; CHECK-NEXT: [[TMP16:%.*]] = icmp slt <2 x i16> [[TMP15]], zeroinitializer
25+
; CHECK-NEXT: [[TMP17:%.*]] = select <2 x i1> [[TMP16]], <2 x i16> [[TMP14]], <2 x i16> zeroinitializer
26+
; CHECK-NEXT: [[TMP18:%.*]] = call <2 x i16> @llvm.smax.v2i16(<2 x i16> [[TMP15]], <2 x i16> zeroinitializer)
27+
; CHECK-NEXT: [[TMP19:%.*]] = or <2 x i16> [[TMP17]], [[TMP18]]
28+
; CHECK-NEXT: store <2 x i16> [[TMP19]], ptr [[P]], align 2
29+
; CHECK-NEXT: ret void
30+
;
31+
%zext795 = zext i16 %load794 to i32
32+
%load798 = load i16, ptr %p, align 2
33+
%gep799 = getelementptr inbounds i8, ptr %p, i64 16
34+
%load800 = load i16, ptr %gep799, align 2
35+
%zext801 = zext i16 %load798 to i32
36+
%zext802 = zext i16 %load800 to i32
37+
%sub809 = sub nsw i32 %zext802, %zext801
38+
%add810 = add nsw i32 %sub809, 3329
39+
%mul811 = mul i32 %add810, %zext795
40+
%zext812 = zext i32 %mul811 to i64
41+
%mul813 = mul nuw nsw i64 %zext812, 5039
42+
%lshr814 = lshr i64 %mul813, 24
43+
%trunc815 = trunc nuw nsw i64 %lshr814 to i32
44+
%mul816 = mul i32 %trunc815, 62207
45+
%add817 = add i32 %mul816, %mul811
46+
%trunc818 = trunc i32 %add817 to i16
47+
%add819 = add i16 %trunc818, -3329
48+
%icmp820 = icmp slt i16 %add819, 0
49+
%select821 = select i1 %icmp820, i16 %trunc818, i16 0
50+
%call822 = call i16 @llvm.smax.i16(i16 %add819, i16 0)
51+
%or823 = or i16 %select821, %call822
52+
store i16 %or823, ptr %p, align 2
53+
%gep826 = getelementptr inbounds i8, ptr %p, i64 2
54+
%load827 = load i16, ptr %gep826, align 2
55+
%gep828 = getelementptr inbounds i8, ptr %p, i64 18
56+
%load829 = load i16, ptr %gep828, align 2
57+
%zext830 = zext i16 %load827 to i32
58+
%zext831 = zext i16 %load829 to i32
59+
%sub838 = sub nsw i32 %zext831, %zext830
60+
%add839 = add nsw i32 %sub838, 3329
61+
%mul840 = mul i32 %add839, %zext795
62+
%zext841 = zext i32 %mul840 to i64
63+
%mul842 = mul nuw nsw i64 %zext841, 5039
64+
%lshr843 = lshr i64 %mul842, 24
65+
%trunc844 = trunc nuw nsw i64 %lshr843 to i32
66+
%mul845 = mul i32 %trunc844, 62207
67+
%add846 = add i32 %mul845, %mul840
68+
%trunc847 = trunc i32 %add846 to i16
69+
%add848 = add i16 %trunc847, -3329
70+
%icmp849 = icmp slt i16 %add848, 0
71+
%select850 = select i1 %icmp849, i16 %trunc847, i16 0
72+
%call851 = call i16 @llvm.smax.i16(i16 %add848, i16 0)
73+
%or852 = or i16 %select850, %call851
74+
store i16 %or852, ptr %gep826, align 2
75+
ret void
76+
}
77+

0 commit comments

Comments
 (0)