Skip to content

Commit 66bde5c

Browse files
committed
[X86][AVX] Updated fptosi_2f64_to_4i32 test to show a missed opportunity to implicitly zero the upper elements
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@279521 91177308-0d34-0410-b5e6-96231b3b80d8
1 parent 8479207 commit 66bde5c

File tree

1 file changed

+6
-2
lines changed

1 file changed

+6
-2
lines changed

test/CodeGen/X86/vec_fp_to_int.ll

Lines changed: 6 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -62,7 +62,8 @@ define <4 x i32> @fptosi_2f64_to_4i32(<2 x double> %a) {
6262
; SSE-NEXT: cvttsd2si %xmm0, %rax
6363
; SSE-NEXT: movd %rax, %xmm0
6464
; SSE-NEXT: punpcklqdq {{.*#+}} xmm1 = xmm1[0],xmm0[0]
65-
; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm1[0,2,2,3]
65+
; SSE-NEXT: pshufd {{.*#+}} xmm0 = xmm1[0,1,0,2]
66+
; SSE-NEXT: psrldq {{.*#+}} xmm0 = xmm0[8,9,10,11,12,13,14,15],zero,zero,zero,zero,zero,zero,zero,zero
6667
; SSE-NEXT: retq
6768
;
6869
; AVX-LABEL: fptosi_2f64_to_4i32:
@@ -74,6 +75,7 @@ define <4 x i32> @fptosi_2f64_to_4i32(<2 x double> %a) {
7475
; AVX-NEXT: vmovq %rax, %xmm0
7576
; AVX-NEXT: vpunpcklqdq {{.*#+}} xmm0 = xmm1[0],xmm0[0]
7677
; AVX-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[0,2,2,3]
78+
; AVX-NEXT: vmovq {{.*#+}} xmm0 = xmm0[0],zero
7779
; AVX-NEXT: retq
7880
;
7981
; AVX512F-LABEL: fptosi_2f64_to_4i32:
@@ -85,15 +87,17 @@ define <4 x i32> @fptosi_2f64_to_4i32(<2 x double> %a) {
8587
; AVX512F-NEXT: vmovq %rax, %xmm0
8688
; AVX512F-NEXT: vpunpcklqdq {{.*#+}} xmm0 = xmm1[0],xmm0[0]
8789
; AVX512F-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[0,2,2,3]
90+
; AVX512F-NEXT: vmovq {{.*#+}} xmm0 = xmm0[0],zero
8891
; AVX512F-NEXT: retq
8992
;
9093
; AVX512DQ-LABEL: fptosi_2f64_to_4i32:
9194
; AVX512DQ: # BB#0:
9295
; AVX512DQ-NEXT: vcvttpd2qq %xmm0, %xmm0
9396
; AVX512DQ-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[0,2,2,3]
97+
; AVX512DQ-NEXT: vmovq {{.*#+}} xmm0 = xmm0[0],zero
9498
; AVX512DQ-NEXT: retq
9599
%cvt = fptosi <2 x double> %a to <2 x i32>
96-
%ext = shufflevector <2 x i32> %cvt, <2 x i32> undef, <4 x i32> <i32 0, i32 1, i32 undef, i32 undef>
100+
%ext = shufflevector <2 x i32> %cvt, <2 x i32> zeroinitializer, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
97101
ret <4 x i32> %ext
98102
}
99103

0 commit comments

Comments
 (0)