Skip to content

Commit aed5e3b

Browse files
committed
[SLP][NFC]Add a test for delaying of insertelements vectorization, NFC.
1 parent 2efc8f8 commit aed5e3b

File tree

1 file changed

+45
-0
lines changed

1 file changed

+45
-0
lines changed
Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
2+
; RUN: opt -S -slp-vectorizer -mtriple x86_64-unknown-linux-gnu < %s | FileCheck %s
3+
4+
define <4 x double> @test(double* %p2, double %i1754, double %i1781, double %i1778) {
5+
; CHECK-LABEL: @test(
6+
; CHECK-NEXT: entry:
7+
; CHECK-NEXT: [[I1771:%.*]] = getelementptr inbounds double, double* [[P2:%.*]], i64 54
8+
; CHECK-NEXT: [[TMP0:%.*]] = insertelement <2 x double> poison, double [[I1754:%.*]], i32 0
9+
; CHECK-NEXT: [[TMP1:%.*]] = insertelement <2 x double> [[TMP0]], double [[I1778:%.*]], i32 1
10+
; CHECK-NEXT: [[TMP2:%.*]] = insertelement <2 x double> [[TMP0]], double [[I1754]], i32 1
11+
; CHECK-NEXT: [[TMP3:%.*]] = fmul fast <2 x double> [[TMP1]], [[TMP2]]
12+
; CHECK-NEXT: [[I1792:%.*]] = fmul fast double [[I1754]], [[I1781:%.*]]
13+
; CHECK-NEXT: [[TMP4:%.*]] = bitcast double* [[I1771]] to <2 x double>*
14+
; CHECK-NEXT: [[TMP5:%.*]] = load <2 x double>, <2 x double>* [[TMP4]], align 8
15+
; CHECK-NEXT: [[TMP6:%.*]] = insertelement <2 x double> [[TMP0]], double [[I1781]], i32 1
16+
; CHECK-NEXT: [[TMP7:%.*]] = fmul fast <2 x double> [[TMP5]], [[TMP6]]
17+
; CHECK-NEXT: [[TMP8:%.*]] = extractelement <2 x double> [[TMP7]], i32 0
18+
; CHECK-NEXT: [[TMP9:%.*]] = extractelement <2 x double> [[TMP7]], i32 1
19+
; CHECK-NEXT: [[TMP10:%.*]] = shufflevector <2 x double> [[TMP3]], <2 x double> poison, <4 x i32> <i32 0, i32 1, i32 undef, i32 undef>
20+
; CHECK-NEXT: [[TMP11:%.*]] = insertelement <4 x double> [[TMP10]], double [[I1792]], i32 2
21+
; CHECK-NEXT: [[TMP12:%.*]] = insertelement <4 x double> [[TMP11]], double [[TMP8]], i32 3
22+
; CHECK-NEXT: [[TMP13:%.*]] = insertelement <4 x double> <double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double poison>, double [[TMP9]], i32 3
23+
; CHECK-NEXT: [[TMP14:%.*]] = fadd fast <4 x double> [[TMP12]], [[TMP13]]
24+
; CHECK-NEXT: ret <4 x double> [[TMP14]]
25+
;
26+
entry:
27+
%i1771 = getelementptr inbounds double, double* %p2, i64 54
28+
%i1772 = load double, double* %i1771, align 8
29+
%i1773 = fmul fast double %i1772, %i1754
30+
%i1782 = fmul fast double %i1754, %i1754
31+
%i1783 = fadd fast double %i1782, 1.000000e+00
32+
%i1787 = fmul fast double %i1778, %i1754
33+
%i1788 = fadd fast double %i1787, 1.000000e+00
34+
%i1792 = fmul fast double %i1754, %i1781
35+
%i1793 = fadd fast double %i1792, 1.000000e+00
36+
%i1795 = getelementptr inbounds double, double* %p2, i64 55
37+
%i1796 = load double, double* %i1795, align 8
38+
%i1797 = fmul fast double %i1796, %i1781
39+
%i1798 = fadd fast double %i1773, %i1797
40+
%i1976 = insertelement <4 x double> zeroinitializer, double %i1783, i64 0
41+
%i1982 = insertelement <4 x double> %i1976, double %i1788, i64 1
42+
%i1988 = insertelement <4 x double> %i1982, double %i1793, i64 2
43+
%i1994 = insertelement <4 x double> %i1988, double %i1798, i64 3
44+
ret <4 x double> %i1994
45+
}

0 commit comments

Comments
 (0)