Skip to content

Commit eb85c8e

Browse files
committed
[X86] Add test case for llvm#81136
1 parent b846613 commit eb85c8e

File tree

1 file changed

+46
-0
lines changed

1 file changed

+46
-0
lines changed

llvm/test/CodeGen/X86/pr81136.ll

Lines changed: 46 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,46 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 4
2+
; RUN: llc < %s -mtriple=x86_64-- -mcpu=btver2 | FileCheck %s
3+
4+
; FIXME: The constant in xmm4 should be materialized with vpmovzxbq as [128,1] instead of with vpmovzxbd as [128,1,0,0]
5+
; Regression test body for llvm#81136.
;
; Inputs:
;   %a0, %a1 - i32 values, each reinterpreted as <2 x i16>.
;   %a2      - pointer from which a <4 x i64> is loaded (volatile, align 32).
; Result:
;   The negated count of set lanes in a 4-lane predicate:
;   (loaded data != per-lane constant) AND (shuffled vector != 0).
;
; The assembly assertions inside the function are autogenerated (see the NOTE
; at the top of the file); regenerate them with the script rather than editing
; them by hand.
define i64 @PR81136(i32 %a0, i32 %a1, ptr %a2) {
6+
; CHECK-LABEL: PR81136:
7+
; CHECK: # %bb.0:
8+
; CHECK-NEXT: vmovd %edi, %xmm0
9+
; CHECK-NEXT: vmovd %esi, %xmm1
10+
; CHECK-NEXT: vmovdqa (%rdx), %ymm2
11+
; CHECK-NEXT: vpxor %xmm3, %xmm3, %xmm3
12+
; CHECK-NEXT: vpmovzxbd {{.*#+}} xmm4 = [128,1,0,0]
13+
; CHECK-NEXT: vpcmpgtq %xmm3, %xmm4, %xmm4
14+
; CHECK-NEXT: vpcmpgtw %xmm0, %xmm1, %xmm0
15+
; CHECK-NEXT: vpcmpeqd %xmm1, %xmm1, %xmm1
16+
; CHECK-NEXT: vpxor %xmm1, %xmm0, %xmm0
17+
; CHECK-NEXT: vpmovsxwq %xmm0, %xmm0
18+
; CHECK-NEXT: vpalignr {{.*#+}} xmm0 = mem[8,9,10,11,12,13,14,15],xmm0[0,1,2,3,4,5,6,7]
19+
; CHECK-NEXT: vpcmpeqq %xmm3, %xmm0, %xmm0
20+
; CHECK-NEXT: vpxor %xmm1, %xmm0, %xmm0
21+
; CHECK-NEXT: vpcmpeqq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm1
22+
; CHECK-NEXT: vextractf128 $1, %ymm2, %xmm2
23+
; CHECK-NEXT: vpcmpeqq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm2
24+
; CHECK-NEXT: vinsertf128 $1, %xmm0, %ymm4, %ymm0
25+
; CHECK-NEXT: vinsertf128 $1, %xmm2, %ymm1, %ymm1
26+
; CHECK-NEXT: vandnpd %ymm0, %ymm1, %ymm0
27+
; CHECK-NEXT: vmovmskpd %ymm0, %eax
28+
; CHECK-NEXT: popcntl %eax, %eax
29+
; CHECK-NEXT: negq %rax
30+
; CHECK-NEXT: retq
31+
; Reinterpret each i32 argument as two i16 lanes.
%v0 = bitcast i32 %a0 to <2 x i16>
32+
%v1 = bitcast i32 %a1 to <2 x i16>
33+
; Per-lane signed compare: %v1 <= %v0.
%cmp15 = icmp sle <2 x i16> %v1, %v0
34+
; Widen each i1 lane to i64 by sign extension (true -> -1, false -> 0).
%conv16 = sext <2 x i1> %cmp15 to <2 x i64>
35+
; Mask indices 0-1 select from %conv16 and 2-3 from the constant operand, so
; the result is <128, 1, 1, %conv16[0]>.
%shuffle29 = shufflevector <2 x i64> %conv16, <2 x i64> <i64 128, i64 1>, <4 x i32> <i32 2, i32 3, i32 3, i32 0>
36+
; Volatile load of four i64 lanes from %a2.
%data = load volatile <4 x i64>, ptr %a2, align 32
37+
; Lane is true where the loaded value differs from the matching constant.
%cmp65 = icmp ne <4 x i64> %data, <i64 -2071602529, i64 -1537047284, i64 717942021, i64 597457239>
38+
; Lane is true where the shuffled value is non-zero; lanes 0-2 hold the
; non-zero constants 128, 1, 1, so only lane 3 depends on %cmp15.
%cmp67 = icmp ne <4 x i64> %shuffle29, zeroinitializer
39+
%and = and <4 x i1> %cmp65, %cmp67
40+
; Pack the four i1 lanes into a 4-bit integer mask.
%mask = bitcast <4 x i1> %and to i4
41+
; Count the set bits of the mask.
%cnt = tail call i4 @llvm.ctpop.i4(i4 %mask)
42+
%cntz = zext i4 %cnt to i64
43+
; Return 0 - count.
%res = sub nsw i64 0, %cntz
44+
ret i64 %res
45+
}
46+
; Population-count intrinsic on i4; @PR81136 calls it on the 4-bit lane mask.
declare i4 @llvm.ctpop.i4(i4)

0 commit comments

Comments
 (0)