Skip to content

Commit 70d11ff

Browse files
committed
[X86] Add test coverage for #90847
1 parent a48ebb8 commit 70d11ff

File tree

1 file changed

+71
-0
lines changed

1 file changed

+71
-0
lines changed

llvm/test/CodeGen/X86/pr90847.ll

Lines changed: 71 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,71 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 4
2+
; RUN: llc < %s -mtriple=x86_64-- -mattr=+avx | FileCheck %s --check-prefixes=AVX1
3+
; RUN: llc < %s -mtriple=x86_64-- -mattr=+avx2 | FileCheck %s --check-prefixes=AVX2
4+
5+
; TODO: PR90847 - failure to peek through FREEZE(SETCC()) results in VPMOVMSKB(TRUNC()) instead of VMOVMSKPS
6+
7+
define i32 @PR90847(<8 x float> %x) nounwind {
8+
; AVX1-LABEL: PR90847:
9+
; AVX1: # %bb.0: # %entry
10+
; AVX1-NEXT: vshufps {{.*#+}} ymm1 = ymm0[1,0,3,2,5,4,7,6]
11+
; AVX1-NEXT: vminps %ymm1, %ymm0, %ymm1
12+
; AVX1-NEXT: vshufpd {{.*#+}} ymm2 = ymm1[1,0,3,2]
13+
; AVX1-NEXT: vminps %ymm2, %ymm1, %ymm1
14+
; AVX1-NEXT: vperm2f128 {{.*#+}} ymm2 = ymm1[2,3,0,1]
15+
; AVX1-NEXT: vminps %ymm2, %ymm1, %ymm1
16+
; AVX1-NEXT: vcmpeqps %ymm0, %ymm1, %ymm0
17+
; AVX1-NEXT: vextractf128 $1, %ymm0, %xmm1
18+
; AVX1-NEXT: vpackssdw %xmm1, %xmm0, %xmm0
19+
; AVX1-NEXT: vpacksswb %xmm0, %xmm0, %xmm0
20+
; AVX1-NEXT: vpmovmskb %xmm0, %eax
21+
; AVX1-NEXT: testb %al, %al
22+
; AVX1-NEXT: je .LBB0_1
23+
; AVX1-NEXT: # %bb.2: # %cond.false
24+
; AVX1-NEXT: movzbl %al, %eax
25+
; AVX1-NEXT: rep bsfl %eax, %eax
26+
; AVX1-NEXT: vzeroupper
27+
; AVX1-NEXT: retq
28+
; AVX1-NEXT: .LBB0_1:
29+
; AVX1-NEXT: movl $32, %eax
30+
; AVX1-NEXT: vzeroupper
31+
; AVX1-NEXT: retq
32+
;
33+
; AVX2-LABEL: PR90847:
34+
; AVX2: # %bb.0: # %entry
35+
; AVX2-NEXT: vshufps {{.*#+}} ymm1 = ymm0[1,0,3,2,5,4,7,6]
36+
; AVX2-NEXT: vminps %ymm1, %ymm0, %ymm1
37+
; AVX2-NEXT: vshufpd {{.*#+}} ymm2 = ymm1[1,0,3,2]
38+
; AVX2-NEXT: vminps %ymm2, %ymm1, %ymm1
39+
; AVX2-NEXT: vpermpd {{.*#+}} ymm2 = ymm1[2,3,0,1]
40+
; AVX2-NEXT: vminps %ymm2, %ymm1, %ymm1
41+
; AVX2-NEXT: vcmpeqps %ymm0, %ymm1, %ymm0
42+
; AVX2-NEXT: vextractf128 $1, %ymm0, %xmm1
43+
; AVX2-NEXT: vpackssdw %xmm1, %xmm0, %xmm0
44+
; AVX2-NEXT: vpacksswb %xmm0, %xmm0, %xmm0
45+
; AVX2-NEXT: vpmovmskb %xmm0, %eax
46+
; AVX2-NEXT: testb %al, %al
47+
; AVX2-NEXT: je .LBB0_1
48+
; AVX2-NEXT: # %bb.2: # %cond.false
49+
; AVX2-NEXT: movzbl %al, %eax
50+
; AVX2-NEXT: rep bsfl %eax, %eax
51+
; AVX2-NEXT: vzeroupper
52+
; AVX2-NEXT: retq
53+
; AVX2-NEXT: .LBB0_1:
54+
; AVX2-NEXT: movl $32, %eax
55+
; AVX2-NEXT: vzeroupper
56+
; AVX2-NEXT: retq
57+
; IR body overview: three shuffle+min steps over %x, an ordered-equal compare of
; the result against %x, conversion of the 8 lane results to an i8 bitmask, and a
; count-trailing-zeros on that mask.
; NOTE(review): the shuffle pattern looks like a butterfly horizontal-minimum
; reduction that leaves the overall minimum in every lane; confirm the NaN
; behaviour of the x86 min intrinsic before relying on that reading.
entry:
58+
; Step 1: swap the two elements of each adjacent pair, then min with the original.
%shuf1 = shufflevector <8 x float> %x, <8 x float> poison, <8 x i32> <i32 1, i32 0, i32 3, i32 2, i32 5, i32 4, i32 7, i32 6>
59+
%min1 = tail call noundef <8 x float> @llvm.x86.avx.min.ps.256(<8 x float> %x, <8 x float> %shuf1)
60+
; Step 2: swap the 2-element pairs inside each 4-element half, then min again.
%shuf2 = shufflevector <8 x float> %min1, <8 x float> poison, <8 x i32> <i32 2, i32 3, i32 0, i32 1, i32 6, i32 7, i32 4, i32 5>
61+
%min2 = tail call noundef <8 x float> @llvm.x86.avx.min.ps.256(<8 x float> %min1, <8 x float> %shuf2)
62+
; Step 3: swap the low and high 4-element halves, then min a final time.
%shuf3 = shufflevector <8 x float> %min2, <8 x float> poison, <8 x i32> <i32 4, i32 5, i32 6, i32 7, i32 0, i32 1, i32 2, i32 3>
63+
%min3 = tail call noundef <8 x float> @llvm.x86.avx.min.ps.256(<8 x float> %min2, <8 x float> %shuf3)
64+
; Per-lane ordered-equal test of the reduced value against the input.
%fcmp = fcmp oeq <8 x float> %min3, %x
65+
; Collapse the eight i1 lane results into a single 8-bit mask.
%mask = bitcast <8 x i1> %fcmp to i8
66+
%zext = zext i8 %mask to i32
67+
; %cmp is true when no lane compared equal (mask is all zeros).
%cmp = icmp eq i8 %mask, 0
68+
; Second operand `i1 false`: a zero input is not poison for cttz, so the call is
; well defined even when the mask is empty.
%tz = tail call range(i32 0, 33) i32 @llvm.cttz.i32(i32 %zext, i1 false)
69+
; Empty mask selects undef; otherwise the trailing-zero count of the mask.
%conv = select i1 %cmp, i32 undef, i32 %tz
70+
ret i32 %conv
71+
}

0 commit comments

Comments
 (0)