|
| 1 | +; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py UTC_ARGS: --version 4 |
| 2 | +; RUN: llc < %s -mtriple=x86_64-- -mcpu=btver2 | FileCheck %s |
| 3 | + |
| 4 | +; FIXME: Should be vpmovzxbq[128,1] instead of vpmovzxbd[128,1,0,0] |
| | +; Test function named after PR81136: takes two i32 values and a pointer to a |
| | +; <4 x i64>, and returns the negated number of lanes in which the loaded data |
| | +; differs from a fixed constant vector AND the shuffled mask vector is non-zero. |
| 5 | +define i64 @PR81136(i32 %a0, i32 %a1, ptr %a2) { |
| 6 | +; CHECK-LABEL: PR81136: |
| 7 | +; CHECK: # %bb.0: |
| 8 | +; CHECK-NEXT: vmovd %edi, %xmm0 |
| 9 | +; CHECK-NEXT: vmovd %esi, %xmm1 |
| 10 | +; CHECK-NEXT: vmovdqa (%rdx), %ymm2 |
| 11 | +; CHECK-NEXT: vpxor %xmm3, %xmm3, %xmm3 |
| 12 | +; CHECK-NEXT: vpmovzxbd {{.*#+}} xmm4 = [128,1,0,0] |
| 13 | +; CHECK-NEXT: vpcmpgtq %xmm3, %xmm4, %xmm4 |
| 14 | +; CHECK-NEXT: vpcmpgtw %xmm0, %xmm1, %xmm0 |
| 15 | +; CHECK-NEXT: vpcmpeqd %xmm1, %xmm1, %xmm1 |
| 16 | +; CHECK-NEXT: vpxor %xmm1, %xmm0, %xmm0 |
| 17 | +; CHECK-NEXT: vpmovsxwq %xmm0, %xmm0 |
| 18 | +; CHECK-NEXT: vpalignr {{.*#+}} xmm0 = mem[8,9,10,11,12,13,14,15],xmm0[0,1,2,3,4,5,6,7] |
| 19 | +; CHECK-NEXT: vpcmpeqq %xmm3, %xmm0, %xmm0 |
| 20 | +; CHECK-NEXT: vpxor %xmm1, %xmm0, %xmm0 |
| 21 | +; CHECK-NEXT: vpcmpeqq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm1 |
| 22 | +; CHECK-NEXT: vextractf128 $1, %ymm2, %xmm2 |
| 23 | +; CHECK-NEXT: vpcmpeqq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm2 |
| 24 | +; CHECK-NEXT: vinsertf128 $1, %xmm0, %ymm4, %ymm0 |
| 25 | +; CHECK-NEXT: vinsertf128 $1, %xmm2, %ymm1, %ymm1 |
| 26 | +; CHECK-NEXT: vandnpd %ymm0, %ymm1, %ymm0 |
| 27 | +; CHECK-NEXT: vmovmskpd %ymm0, %eax |
| 28 | +; CHECK-NEXT: popcntl %eax, %eax |
| 29 | +; CHECK-NEXT: negq %rax |
| 30 | +; CHECK-NEXT: retq |
| | + ; Reinterpret each i32 argument as a vector of two i16 lanes. |
| 31 | + %v0 = bitcast i32 %a0 to <2 x i16> |
| 32 | + %v1 = bitcast i32 %a1 to <2 x i16> |
| | + ; Per-lane signed (%v1 <= %v0), sign-extended so each i64 lane is all-ones or zero. |
| 33 | + %cmp15 = icmp sle <2 x i16> %v1, %v0 |
| 34 | + %conv16 = sext <2 x i1> %cmp15 to <2 x i64> |
| | + ; Mask indices 2 and 3 pick from the constant operand <128, 1>; index 0 picks |
| | + ; lane 0 of %conv16. The result is <128, 1, 1, %conv16[0]>. |
| 35 | + %shuffle29 = shufflevector <2 x i64> %conv16, <2 x i64> <i64 128, i64 1>, <4 x i32> <i32 2, i32 3, i32 3, i32 0> |
| | + ; Volatile, 32-byte-aligned load of the <4 x i64> data vector from %a2. |
| 36 | + %data = load volatile <4 x i64>, ptr %a2, align 32 |
| | + ; A lane is set when the data differs from the constant and the shuffled value is non-zero. |
| 37 | + %cmp65 = icmp ne <4 x i64> %data, <i64 -2071602529, i64 -1537047284, i64 717942021, i64 597457239> |
| 38 | + %cmp67 = icmp ne <4 x i64> %shuffle29, zeroinitializer |
| 39 | + %and = and <4 x i1> %cmp65, %cmp67 |
| | + ; Pack the four lane bits into an i4 and count how many are set. |
| 40 | + %mask = bitcast <4 x i1> %and to i4 |
| 41 | + %cnt = tail call i4 @llvm.ctpop.i4(i4 %mask) |
| | + ; Zero-extend the count to i64 and return its negation (0 - count). |
| 42 | + %cntz = zext i4 %cnt to i64 |
| 43 | + %res = sub nsw i64 0, %cntz |
| 44 | + ret i64 %res |
| 45 | +} |
| | +; Declaration of the i4 overload of the llvm.ctpop intrinsic called by @PR81136. |
| 46 | +declare i4 @llvm.ctpop.i4(i4) |
0 commit comments