1
1
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
2
- ; RUN: llc -mtriple=x86_64-unknown-unknown -mattr=+avx < %s | FileCheck %s --check-prefix=AVX
3
- ; RUN: llc -mtriple=i386-unknown-linux-gnu -mcpu=knl < %s | FileCheck %s --check-prefix=KNL-32
2
+ ; RUN: llc -mtriple=x86_64-unknown-unknown -mattr=+avx < %s | FileCheck %s --check-prefixes=AVX,AVX1
3
+ ; RUN: llc -mtriple=x86_64-unknown-unknown -mattr=+avx2 < %s | FileCheck %s --check-prefixes=AVX,AVX2
4
+ ; RUN: llc -mtriple=i386-unknown-linux-gnu -mcpu=knl < %s | FileCheck %s --check-prefixes=AVX,KNL-32
4
5
5
6
6
7
; Verify that we don't crash during codegen due to a wrong lowering
7
8
; of a setcc node with illegal operand types and return type.
8
9
9
10
define <8 x i16 > @pr25080 (<8 x i32 > %a ) {
10
- ; AVX-LABEL: pr25080:
11
- ; AVX: # %bb.0: # %entry
12
- ; AVX-NEXT: vextractf128 $1, %ymm0, %xmm0
13
- ; AVX-NEXT: vpand {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
14
- ; AVX-NEXT: vpxor %xmm1, %xmm1, %xmm1
15
- ; AVX-NEXT: vpcmpeqd %xmm1, %xmm0, %xmm0
16
- ; AVX-NEXT: vpackssdw %xmm0, %xmm0, %xmm0
17
- ; AVX-NEXT: vpor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
18
- ; AVX-NEXT: vzeroupper
19
- ; AVX-NEXT: retq
11
+ ; AVX1-LABEL: pr25080:
12
+ ; AVX1: # %bb.0: # %entry
13
+ ; AVX1-NEXT: vextractf128 $1, %ymm0, %xmm0
14
+ ; AVX1-NEXT: vpand {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
15
+ ; AVX1-NEXT: vpxor %xmm1, %xmm1, %xmm1
16
+ ; AVX1-NEXT: vpcmpeqd %xmm1, %xmm0, %xmm0
17
+ ; AVX1-NEXT: vpackssdw %xmm0, %xmm0, %xmm0
18
+ ; AVX1-NEXT: vpor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
19
+ ; AVX1-NEXT: vzeroupper
20
+ ; AVX1-NEXT: retq
21
+ ;
22
+ ; AVX2-LABEL: pr25080:
23
+ ; AVX2: # %bb.0: # %entry
24
+ ; AVX2-NEXT: vpbroadcastd {{.*#+}} ymm1 = [8388607,8388607,8388607,8388607,8388607,8388607,8388607,8388607]
25
+ ; AVX2-NEXT: vpand %ymm1, %ymm0, %ymm0
26
+ ; AVX2-NEXT: vpxor %xmm1, %xmm1, %xmm1
27
+ ; AVX2-NEXT: vpcmpeqd %ymm1, %ymm0, %ymm0
28
+ ; AVX2-NEXT: vextracti128 $1, %ymm0, %xmm0
29
+ ; AVX2-NEXT: vpackssdw %xmm0, %xmm0, %xmm0
30
+ ; AVX2-NEXT: vpor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
31
+ ; AVX2-NEXT: vzeroupper
32
+ ; AVX2-NEXT: retq
20
33
;
21
34
; KNL-32-LABEL: pr25080:
22
35
; KNL-32: # %bb.0: # %entry
@@ -38,23 +51,40 @@ entry:
38
51
}
39
52
40
53
define void @pr26232 (i64 %a , <16 x i1 > %b ) {
41
- ; AVX-LABEL: pr26232:
42
- ; AVX: # %bb.0: # %allocas
43
- ; AVX-NEXT: vpxor %xmm1, %xmm1, %xmm1
44
- ; AVX-NEXT: .p2align 4, 0x90
45
- ; AVX-NEXT: .LBB1_1: # %for_loop599
46
- ; AVX-NEXT: # =>This Inner Loop Header: Depth=1
47
- ; AVX-NEXT: cmpq $65536, %rdi # imm = 0x10000
48
- ; AVX-NEXT: setl %al
49
- ; AVX-NEXT: vmovd %eax, %xmm2
50
- ; AVX-NEXT: vpshufb %xmm1, %xmm2, %xmm2
51
- ; AVX-NEXT: vpand %xmm0, %xmm2, %xmm2
52
- ; AVX-NEXT: vpsllw $7, %xmm2, %xmm2
53
- ; AVX-NEXT: vpmovmskb %xmm2, %eax
54
- ; AVX-NEXT: testl %eax, %eax
55
- ; AVX-NEXT: jne .LBB1_1
56
- ; AVX-NEXT: # %bb.2: # %for_exit600
57
- ; AVX-NEXT: retq
54
+ ; AVX1-LABEL: pr26232:
55
+ ; AVX1: # %bb.0: # %allocas
56
+ ; AVX1-NEXT: vpxor %xmm1, %xmm1, %xmm1
57
+ ; AVX1-NEXT: .p2align 4, 0x90
58
+ ; AVX1-NEXT: .LBB1_1: # %for_loop599
59
+ ; AVX1-NEXT: # =>This Inner Loop Header: Depth=1
60
+ ; AVX1-NEXT: cmpq $65536, %rdi # imm = 0x10000
61
+ ; AVX1-NEXT: setl %al
62
+ ; AVX1-NEXT: vmovd %eax, %xmm2
63
+ ; AVX1-NEXT: vpshufb %xmm1, %xmm2, %xmm2
64
+ ; AVX1-NEXT: vpand %xmm0, %xmm2, %xmm2
65
+ ; AVX1-NEXT: vpsllw $7, %xmm2, %xmm2
66
+ ; AVX1-NEXT: vpmovmskb %xmm2, %eax
67
+ ; AVX1-NEXT: testl %eax, %eax
68
+ ; AVX1-NEXT: jne .LBB1_1
69
+ ; AVX1-NEXT: # %bb.2: # %for_exit600
70
+ ; AVX1-NEXT: retq
71
+ ;
72
+ ; AVX2-LABEL: pr26232:
73
+ ; AVX2: # %bb.0: # %allocas
74
+ ; AVX2-NEXT: .p2align 4, 0x90
75
+ ; AVX2-NEXT: .LBB1_1: # %for_loop599
76
+ ; AVX2-NEXT: # =>This Inner Loop Header: Depth=1
77
+ ; AVX2-NEXT: cmpq $65536, %rdi # imm = 0x10000
78
+ ; AVX2-NEXT: setl %al
79
+ ; AVX2-NEXT: vmovd %eax, %xmm1
80
+ ; AVX2-NEXT: vpbroadcastb %xmm1, %xmm1
81
+ ; AVX2-NEXT: vpand %xmm0, %xmm1, %xmm1
82
+ ; AVX2-NEXT: vpsllw $7, %xmm1, %xmm1
83
+ ; AVX2-NEXT: vpmovmskb %xmm1, %eax
84
+ ; AVX2-NEXT: testl %eax, %eax
85
+ ; AVX2-NEXT: jne .LBB1_1
86
+ ; AVX2-NEXT: # %bb.2: # %for_exit600
87
+ ; AVX2-NEXT: retq
58
88
;
59
89
; KNL-32-LABEL: pr26232:
60
90
; KNL-32: # %bb.0: # %allocas
@@ -108,14 +138,7 @@ define <4 x i32> @pcmpgt(<4 x i8> %x) {
108
138
; AVX-NEXT: vpmovzxbd {{.*#+}} xmm0 = xmm0[0],zero,zero,zero,xmm0[1],zero,zero,zero,xmm0[2],zero,zero,zero,xmm0[3],zero,zero,zero
109
139
; AVX-NEXT: vpxor %xmm1, %xmm1, %xmm1
110
140
; AVX-NEXT: vpcmpgtd %xmm1, %xmm0, %xmm0
111
- ; AVX-NEXT: retq
112
- ;
113
- ; KNL-32-LABEL: pcmpgt:
114
- ; KNL-32: # %bb.0:
115
- ; KNL-32-NEXT: vpmovzxbd {{.*#+}} xmm0 = xmm0[0],zero,zero,zero,xmm0[1],zero,zero,zero,xmm0[2],zero,zero,zero,xmm0[3],zero,zero,zero
116
- ; KNL-32-NEXT: vpxor %xmm1, %xmm1, %xmm1
117
- ; KNL-32-NEXT: vpcmpgtd %xmm1, %xmm0, %xmm0
118
- ; KNL-32-NEXT: retl
141
+ ; AVX-NEXT: ret{{[l|q]}}
119
142
%zext = zext <4 x i8 > %x to <4 x i32 >
120
143
%icmp = icmp ne <4 x i32 > %zext , zeroinitializer
121
144
%sext = sext <4 x i1 > %icmp to <4 x i32 >
0 commit comments