Skip to content

Commit 181b2c1

Browse files
committed
[SLP][NFC] Add a test for PR72202 to show a bug in mask generation for
vectorized extractelement operands.
1 parent ac4868e commit 181b2c1

File tree

1 file changed

+53
-0
lines changed

1 file changed

+53
-0
lines changed
Lines changed: 53 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,53 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4
2+
; RUN: opt -S --passes=slp-vectorizer -mtriple=x86_64-unknown-linux-gnu < %s | FileCheck %s
3+
4+
; @test: reduced SLP-vectorizer input for PR72202. Takes no arguments and
; returns a double. The scalar body loads elements 5, 6, 8 and 9 of a
; [13 x double] array addressed off a null base, multiplies values by 0.0,
; and sums the products in two separate chains (one per basic block).
;
; The autogenerated assertions below record the vectorizer's current output:
; two <2 x double> loads (starting at elements 5 and 8), a shuffle with mask
; <1, 3> that picks elements 6 and 9, a widening shuffle to <4 x double> whose
; lanes 2 and 3 are poison, and a 4-wide fadd reduction over the product.
;
; NOTE(review): in the scalar entry block the other two reduction inputs are
; the constant products %0 and %1, whereas the expected vector code has poison
; in those lanes. Presumably this is the mask-generation bug the test is meant
; to expose -- confirm against PR72202 before regenerating the assertions.
define double @test() {
5+
; CHECK-LABEL: define double @test() {
6+
; CHECK-NEXT: entry:
7+
; CHECK-NEXT: [[TMP0:%.*]] = load <2 x double>, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 5), align 8
8+
; CHECK-NEXT: [[TMP1:%.*]] = load <2 x double>, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 8), align 16
9+
; CHECK-NEXT: [[TMP2:%.*]] = shufflevector <2 x double> [[TMP0]], <2 x double> [[TMP1]], <2 x i32> <i32 1, i32 3>
10+
; CHECK-NEXT: [[TMP3:%.*]] = shufflevector <2 x double> [[TMP2]], <2 x double> poison, <4 x i32> <i32 0, i32 1, i32 poison, i32 poison>
11+
; CHECK-NEXT: [[TMP4:%.*]] = fmul <4 x double> zeroinitializer, [[TMP3]]
12+
; CHECK-NEXT: [[TMP5:%.*]] = call reassoc nsz double @llvm.vector.reduce.fadd.v4f64(double -0.000000e+00, <4 x double> [[TMP4]])
13+
; CHECK-NEXT: [[TMP6:%.*]] = fmul double [[TMP5]], 0.000000e+00
14+
; CHECK-NEXT: store double [[TMP6]], ptr null, align 16
15+
; CHECK-NEXT: br label [[BB:%.*]]
16+
; CHECK: bb:
17+
; CHECK-NEXT: [[TMP7:%.*]] = fmul <2 x double> [[TMP1]], zeroinitializer
18+
; CHECK-NEXT: [[TMP8:%.*]] = extractelement <2 x double> [[TMP7]], i32 0
19+
; CHECK-NEXT: [[TMP9:%.*]] = extractelement <2 x double> [[TMP7]], i32 1
20+
; CHECK-NEXT: [[TMP10:%.*]] = fadd double [[TMP8]], [[TMP9]]
21+
; CHECK-NEXT: [[TMP11:%.*]] = fmul <2 x double> [[TMP0]], zeroinitializer
22+
; CHECK-NEXT: [[TMP12:%.*]] = extractelement <2 x double> [[TMP11]], i32 1
23+
; CHECK-NEXT: [[TMP13:%.*]] = fadd double [[TMP12]], [[TMP10]]
24+
; CHECK-NEXT: [[TMP14:%.*]] = extractelement <2 x double> [[TMP11]], i32 0
25+
; CHECK-NEXT: [[TMP15:%.*]] = fadd double [[TMP14]], [[TMP13]]
26+
; CHECK-NEXT: ret double [[TMP15]]
27+
;
28+
; Entry block: a `reassoc nsz` fadd chain (%2 -> %6 -> %10) sums four products:
; the constant products %0 and %1, plus %5 (element 6 * 0.0) and %9
; (element 9 * 0.0). The sum is multiplied by 0.0 and stored to null.
; Loads %3 (element 5) and %7 (element 8) are issued here but only used in %bb.
entry:
29+
%0 = fmul double 0.000000e+00, 0.000000e+00
30+
%1 = fmul double 0.000000e+00, 0.000000e+00
31+
%2 = fadd reassoc nsz double %1, %0
32+
%3 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 5), align 8
33+
%4 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 6), align 16
34+
%5 = fmul double %4, 0.000000e+00
35+
%6 = fadd reassoc nsz double %5, %2
36+
%7 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 8), align 16
37+
%8 = load double, ptr getelementptr inbounds ([13 x double], ptr null, i64 0, i64 9), align 8
38+
%9 = fmul double %8, 0.000000e+00
39+
%10 = fadd reassoc nsz double %9, %6
40+
%11 = fmul double %10, 0.000000e+00
41+
store double %11, ptr null, align 16
42+
br label %bb
43+
44+
; Second block: multiplies all four loaded values (%8, %7, %4, %3) by 0.0 and
; sums them with plain fadd instructions (no fast-math flags), then returns
; the total. The expected output above keeps these adds scalar, fed by
; extractelement from two <2 x double> fmuls.
bb:
45+
%12 = fmul double %8, 0.000000e+00
46+
%13 = fmul double %7, 0.000000e+00
47+
%14 = fadd double %13, %12
48+
%15 = fmul double %4, 0.000000e+00
49+
%16 = fadd double %15, %14
50+
%17 = fmul double %3, 0.000000e+00
51+
%18 = fadd double %17, %16
52+
ret double %18
53+
}

0 commit comments

Comments
 (0)