Skip to content

Commit ffe05b8

Browse files
committed
[MCA][X86] Add missing IceLake test coverage for VPOPCNTDQ instructions
1 parent 4c85412 commit ffe05b8

File tree

2 files changed

+246
-0
lines changed

2 files changed

+246
-0
lines changed
Lines changed: 93 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,93 @@
1+
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
2+
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=icelake-server -instruction-tables < %s | FileCheck %s
3+
# Input instructions for the instruction-tables run: each group of three covers
# a register source, a full-width memory source, and a broadcast memory source.

# vpopcntd, zmm, unmasked ({1to16} broadcast).
4+
vpopcntd %zmm1, %zmm0
5+
vpopcntd (%rdi), %zmm0
6+
vpopcntd (%rdi){1to16}, %zmm0
7+
# vpopcntd, zmm, masked with {%k1}.
8+
vpopcntd %zmm1, %zmm0 {%k1}
9+
vpopcntd (%rdi), %zmm0 {%k1}
10+
vpopcntd (%rdi){1to16}, %zmm0 {%k1}
11+
# vpopcntd, zmm, masked with {%k1} {z} (zeroing).
12+
vpopcntd %zmm1, %zmm0 {%k1} {z}
13+
vpopcntd (%rdi), %zmm0 {%k1} {z}
14+
vpopcntd (%rdi){1to16}, %zmm0 {%k1} {z}
15+
# vpopcntq, zmm, unmasked ({1to8} broadcast).
16+
vpopcntq %zmm1, %zmm0
17+
vpopcntq (%rdi), %zmm0
18+
vpopcntq (%rdi){1to8}, %zmm0
19+
# vpopcntq, zmm, masked with {%k1}.
20+
vpopcntq %zmm1, %zmm0 {%k1}
21+
vpopcntq (%rdi), %zmm0 {%k1}
22+
vpopcntq (%rdi){1to8}, %zmm0 {%k1}
23+
# vpopcntq, zmm, masked with {%k1} {z} (zeroing).
24+
vpopcntq %zmm1, %zmm0 {%k1} {z}
25+
vpopcntq (%rdi), %zmm0 {%k1} {z}
26+
vpopcntq (%rdi){1to8}, %zmm0 {%k1} {z}
27+
28+
# CHECK: Instruction Info:
29+
# CHECK-NEXT: [1]: #uOps
30+
# CHECK-NEXT: [2]: Latency
31+
# CHECK-NEXT: [3]: RThroughput
32+
# CHECK-NEXT: [4]: MayLoad
33+
# CHECK-NEXT: [5]: MayStore
34+
# CHECK-NEXT: [6]: HasSideEffects (U)
35+
36+
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
37+
# CHECK-NEXT: 1 1 1.00 vpopcntd %zmm1, %zmm0
38+
# CHECK-NEXT: 2 8 1.00 * vpopcntd (%rdi), %zmm0
39+
# CHECK-NEXT: 2 8 1.00 * vpopcntd (%rdi){1to16}, %zmm0
40+
# CHECK-NEXT: 1 1 1.00 vpopcntd %zmm1, %zmm0 {%k1}
41+
# CHECK-NEXT: 2 8 1.00 * vpopcntd (%rdi), %zmm0 {%k1}
42+
# CHECK-NEXT: 2 8 1.00 * vpopcntd (%rdi){1to16}, %zmm0 {%k1}
43+
# CHECK-NEXT: 1 1 1.00 vpopcntd %zmm1, %zmm0 {%k1} {z}
44+
# CHECK-NEXT: 2 8 1.00 * vpopcntd (%rdi), %zmm0 {%k1} {z}
45+
# CHECK-NEXT: 2 8 1.00 * vpopcntd (%rdi){1to16}, %zmm0 {%k1} {z}
46+
# CHECK-NEXT: 1 1 1.00 vpopcntq %zmm1, %zmm0
47+
# CHECK-NEXT: 2 8 1.00 * vpopcntq (%rdi), %zmm0
48+
# CHECK-NEXT: 2 8 1.00 * vpopcntq (%rdi){1to8}, %zmm0
49+
# CHECK-NEXT: 1 1 1.00 vpopcntq %zmm1, %zmm0 {%k1}
50+
# CHECK-NEXT: 2 8 1.00 * vpopcntq (%rdi), %zmm0 {%k1}
51+
# CHECK-NEXT: 2 8 1.00 * vpopcntq (%rdi){1to8}, %zmm0 {%k1}
52+
# CHECK-NEXT: 1 1 1.00 vpopcntq %zmm1, %zmm0 {%k1} {z}
53+
# CHECK-NEXT: 2 8 1.00 * vpopcntq (%rdi), %zmm0 {%k1} {z}
54+
# CHECK-NEXT: 2 8 1.00 * vpopcntq (%rdi){1to8}, %zmm0 {%k1} {z}
55+
56+
# CHECK: Resources:
57+
# CHECK-NEXT: [0] - ICXDivider
58+
# CHECK-NEXT: [1] - ICXFPDivider
59+
# CHECK-NEXT: [2] - ICXPort0
60+
# CHECK-NEXT: [3] - ICXPort1
61+
# CHECK-NEXT: [4] - ICXPort2
62+
# CHECK-NEXT: [5] - ICXPort3
63+
# CHECK-NEXT: [6] - ICXPort4
64+
# CHECK-NEXT: [7] - ICXPort5
65+
# CHECK-NEXT: [8] - ICXPort6
66+
# CHECK-NEXT: [9] - ICXPort7
67+
# CHECK-NEXT: [10] - ICXPort8
68+
# CHECK-NEXT: [11] - ICXPort9
69+
70+
# CHECK: Resource pressure per iteration:
71+
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11]
72+
# CHECK-NEXT: - - 18.00 - 6.00 6.00 - - - - - -
73+
74+
# CHECK: Resource pressure by instruction:
75+
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] Instructions:
76+
# CHECK-NEXT: - - 1.00 - - - - - - - - - vpopcntd %zmm1, %zmm0
77+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntd (%rdi), %zmm0
78+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntd (%rdi){1to16}, %zmm0
79+
# CHECK-NEXT: - - 1.00 - - - - - - - - - vpopcntd %zmm1, %zmm0 {%k1}
80+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntd (%rdi), %zmm0 {%k1}
81+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntd (%rdi){1to16}, %zmm0 {%k1}
82+
# CHECK-NEXT: - - 1.00 - - - - - - - - - vpopcntd %zmm1, %zmm0 {%k1} {z}
83+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntd (%rdi), %zmm0 {%k1} {z}
84+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntd (%rdi){1to16}, %zmm0 {%k1} {z}
85+
# CHECK-NEXT: - - 1.00 - - - - - - - - - vpopcntq %zmm1, %zmm0
86+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntq (%rdi), %zmm0
87+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntq (%rdi){1to8}, %zmm0
88+
# CHECK-NEXT: - - 1.00 - - - - - - - - - vpopcntq %zmm1, %zmm0 {%k1}
89+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntq (%rdi), %zmm0 {%k1}
90+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntq (%rdi){1to8}, %zmm0 {%k1}
91+
# CHECK-NEXT: - - 1.00 - - - - - - - - - vpopcntq %zmm1, %zmm0 {%k1} {z}
92+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntq (%rdi), %zmm0 {%k1} {z}
93+
# CHECK-NEXT: - - 1.00 - 0.50 0.50 - - - - - - vpopcntq (%rdi){1to8}, %zmm0 {%k1} {z}
Lines changed: 153 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,153 @@
1+
# NOTE: Assertions have been autogenerated by utils/update_mca_test_checks.py
2+
# RUN: llvm-mca -mtriple=x86_64-unknown-unknown -mcpu=icelake-server -instruction-tables < %s | FileCheck %s
3+
# Input instructions for the instruction-tables run: each group of three covers
# a register source, a full-width memory source, and a broadcast memory source.

# vpopcntd, xmm, unmasked ({1to4} broadcast).
4+
vpopcntd %xmm1, %xmm0
5+
vpopcntd (%rdi), %xmm0
6+
vpopcntd (%rdi){1to4}, %xmm0
7+
# vpopcntd, xmm, masked with {%k1}.
8+
vpopcntd %xmm1, %xmm0 {%k1}
9+
vpopcntd (%rdi), %xmm0 {%k1}
10+
vpopcntd (%rdi){1to4}, %xmm0 {%k1}
11+
# vpopcntd, xmm, masked with {%k1} {z} (zeroing).
12+
vpopcntd %xmm1, %xmm0 {%k1} {z}
13+
vpopcntd (%rdi), %xmm0 {%k1} {z}
14+
vpopcntd (%rdi){1to4}, %xmm0 {%k1} {z}
15+
# vpopcntd, ymm, unmasked ({1to8} broadcast).
16+
vpopcntd %ymm1, %ymm0
17+
vpopcntd (%rdi), %ymm0
18+
vpopcntd (%rdi){1to8}, %ymm0
19+
# vpopcntd, ymm, masked with {%k1}.
20+
vpopcntd %ymm1, %ymm0 {%k1}
21+
vpopcntd (%rdi), %ymm0 {%k1}
22+
vpopcntd (%rdi){1to8}, %ymm0 {%k1}
23+
# vpopcntd, ymm, masked with {%k1} {z} (zeroing).
24+
vpopcntd %ymm1, %ymm0 {%k1} {z}
25+
vpopcntd (%rdi), %ymm0 {%k1} {z}
26+
vpopcntd (%rdi){1to8}, %ymm0 {%k1} {z}
27+
# vpopcntq, xmm, unmasked ({1to2} broadcast).
28+
vpopcntq %xmm1, %xmm0
29+
vpopcntq (%rdi), %xmm0
30+
vpopcntq (%rdi){1to2}, %xmm0
31+
# vpopcntq, xmm, masked with {%k1}.
32+
vpopcntq %xmm1, %xmm0 {%k1}
33+
vpopcntq (%rdi), %xmm0 {%k1}
34+
vpopcntq (%rdi){1to2}, %xmm0 {%k1}
35+
# vpopcntq, xmm, masked with {%k1} {z} (zeroing).
36+
vpopcntq %xmm1, %xmm0 {%k1} {z}
37+
vpopcntq (%rdi), %xmm0 {%k1} {z}
38+
vpopcntq (%rdi){1to2}, %xmm0 {%k1} {z}
39+
# vpopcntq, ymm, unmasked ({1to4} broadcast).
40+
vpopcntq %ymm1, %ymm0
41+
vpopcntq (%rdi), %ymm0
42+
vpopcntq (%rdi){1to4}, %ymm0
43+
# vpopcntq, ymm, masked with {%k1}.
44+
vpopcntq %ymm1, %ymm0 {%k1}
45+
vpopcntq (%rdi), %ymm0 {%k1}
46+
vpopcntq (%rdi){1to4}, %ymm0 {%k1}
47+
# vpopcntq, ymm, masked with {%k1} {z} (zeroing).
48+
vpopcntq %ymm1, %ymm0 {%k1} {z}
49+
vpopcntq (%rdi), %ymm0 {%k1} {z}
50+
vpopcntq (%rdi){1to4}, %ymm0 {%k1} {z}
51+
52+
# CHECK: Instruction Info:
53+
# CHECK-NEXT: [1]: #uOps
54+
# CHECK-NEXT: [2]: Latency
55+
# CHECK-NEXT: [3]: RThroughput
56+
# CHECK-NEXT: [4]: MayLoad
57+
# CHECK-NEXT: [5]: MayStore
58+
# CHECK-NEXT: [6]: HasSideEffects (U)
59+
60+
# CHECK: [1] [2] [3] [4] [5] [6] Instructions:
61+
# CHECK-NEXT: 1 1 0.50 vpopcntd %xmm1, %xmm0
62+
# CHECK-NEXT: 2 7 0.50 * vpopcntd (%rdi), %xmm0
63+
# CHECK-NEXT: 2 7 0.50 * vpopcntd (%rdi){1to4}, %xmm0
64+
# CHECK-NEXT: 1 1 0.50 vpopcntd %xmm1, %xmm0 {%k1}
65+
# CHECK-NEXT: 2 7 0.50 * vpopcntd (%rdi), %xmm0 {%k1}
66+
# CHECK-NEXT: 2 7 0.50 * vpopcntd (%rdi){1to4}, %xmm0 {%k1}
67+
# CHECK-NEXT: 1 1 0.50 vpopcntd %xmm1, %xmm0 {%k1} {z}
68+
# CHECK-NEXT: 2 7 0.50 * vpopcntd (%rdi), %xmm0 {%k1} {z}
69+
# CHECK-NEXT: 2 7 0.50 * vpopcntd (%rdi){1to4}, %xmm0 {%k1} {z}
70+
# CHECK-NEXT: 1 1 0.50 vpopcntd %ymm1, %ymm0
71+
# CHECK-NEXT: 2 8 0.50 * vpopcntd (%rdi), %ymm0
72+
# CHECK-NEXT: 2 8 0.50 * vpopcntd (%rdi){1to8}, %ymm0
73+
# CHECK-NEXT: 1 1 0.50 vpopcntd %ymm1, %ymm0 {%k1}
74+
# CHECK-NEXT: 2 8 0.50 * vpopcntd (%rdi), %ymm0 {%k1}
75+
# CHECK-NEXT: 2 8 0.50 * vpopcntd (%rdi){1to8}, %ymm0 {%k1}
76+
# CHECK-NEXT: 1 1 0.50 vpopcntd %ymm1, %ymm0 {%k1} {z}
77+
# CHECK-NEXT: 2 8 0.50 * vpopcntd (%rdi), %ymm0 {%k1} {z}
78+
# CHECK-NEXT: 2 8 0.50 * vpopcntd (%rdi){1to8}, %ymm0 {%k1} {z}
79+
# CHECK-NEXT: 1 1 0.50 vpopcntq %xmm1, %xmm0
80+
# CHECK-NEXT: 2 7 0.50 * vpopcntq (%rdi), %xmm0
81+
# CHECK-NEXT: 2 7 0.50 * vpopcntq (%rdi){1to2}, %xmm0
82+
# CHECK-NEXT: 1 1 0.50 vpopcntq %xmm1, %xmm0 {%k1}
83+
# CHECK-NEXT: 2 7 0.50 * vpopcntq (%rdi), %xmm0 {%k1}
84+
# CHECK-NEXT: 2 7 0.50 * vpopcntq (%rdi){1to2}, %xmm0 {%k1}
85+
# CHECK-NEXT: 1 1 0.50 vpopcntq %xmm1, %xmm0 {%k1} {z}
86+
# CHECK-NEXT: 2 7 0.50 * vpopcntq (%rdi), %xmm0 {%k1} {z}
87+
# CHECK-NEXT: 2 7 0.50 * vpopcntq (%rdi){1to2}, %xmm0 {%k1} {z}
88+
# CHECK-NEXT: 1 1 0.50 vpopcntq %ymm1, %ymm0
89+
# CHECK-NEXT: 2 8 0.50 * vpopcntq (%rdi), %ymm0
90+
# CHECK-NEXT: 2 8 0.50 * vpopcntq (%rdi){1to4}, %ymm0
91+
# CHECK-NEXT: 1 1 0.50 vpopcntq %ymm1, %ymm0 {%k1}
92+
# CHECK-NEXT: 2 8 0.50 * vpopcntq (%rdi), %ymm0 {%k1}
93+
# CHECK-NEXT: 2 8 0.50 * vpopcntq (%rdi){1to4}, %ymm0 {%k1}
94+
# CHECK-NEXT: 1 1 0.50 vpopcntq %ymm1, %ymm0 {%k1} {z}
95+
# CHECK-NEXT: 2 8 0.50 * vpopcntq (%rdi), %ymm0 {%k1} {z}
96+
# CHECK-NEXT: 2 8 0.50 * vpopcntq (%rdi){1to4}, %ymm0 {%k1} {z}
97+
98+
# CHECK: Resources:
99+
# CHECK-NEXT: [0] - ICXDivider
100+
# CHECK-NEXT: [1] - ICXFPDivider
101+
# CHECK-NEXT: [2] - ICXPort0
102+
# CHECK-NEXT: [3] - ICXPort1
103+
# CHECK-NEXT: [4] - ICXPort2
104+
# CHECK-NEXT: [5] - ICXPort3
105+
# CHECK-NEXT: [6] - ICXPort4
106+
# CHECK-NEXT: [7] - ICXPort5
107+
# CHECK-NEXT: [8] - ICXPort6
108+
# CHECK-NEXT: [9] - ICXPort7
109+
# CHECK-NEXT: [10] - ICXPort8
110+
# CHECK-NEXT: [11] - ICXPort9
111+
112+
# CHECK: Resource pressure per iteration:
113+
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11]
114+
# CHECK-NEXT: - - 18.00 18.00 12.00 12.00 - - - - - -
115+
116+
# CHECK: Resource pressure by instruction:
117+
# CHECK-NEXT: [0] [1] [2] [3] [4] [5] [6] [7] [8] [9] [10] [11] Instructions:
118+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntd %xmm1, %xmm0
119+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi), %xmm0
120+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi){1to4}, %xmm0
121+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntd %xmm1, %xmm0 {%k1}
122+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi), %xmm0 {%k1}
123+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi){1to4}, %xmm0 {%k1}
124+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntd %xmm1, %xmm0 {%k1} {z}
125+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi), %xmm0 {%k1} {z}
126+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi){1to4}, %xmm0 {%k1} {z}
127+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntd %ymm1, %ymm0
128+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi), %ymm0
129+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi){1to8}, %ymm0
130+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntd %ymm1, %ymm0 {%k1}
131+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi), %ymm0 {%k1}
132+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi){1to8}, %ymm0 {%k1}
133+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntd %ymm1, %ymm0 {%k1} {z}
134+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi), %ymm0 {%k1} {z}
135+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntd (%rdi){1to8}, %ymm0 {%k1} {z}
136+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntq %xmm1, %xmm0
137+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi), %xmm0
138+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi){1to2}, %xmm0
139+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntq %xmm1, %xmm0 {%k1}
140+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi), %xmm0 {%k1}
141+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi){1to2}, %xmm0 {%k1}
142+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntq %xmm1, %xmm0 {%k1} {z}
143+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi), %xmm0 {%k1} {z}
144+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi){1to2}, %xmm0 {%k1} {z}
145+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntq %ymm1, %ymm0
146+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi), %ymm0
147+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi){1to4}, %ymm0
148+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntq %ymm1, %ymm0 {%k1}
149+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi), %ymm0 {%k1}
150+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi){1to4}, %ymm0 {%k1}
151+
# CHECK-NEXT: - - 0.50 0.50 - - - - - - - - vpopcntq %ymm1, %ymm0 {%k1} {z}
152+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi), %ymm0 {%k1} {z}
153+
# CHECK-NEXT: - - 0.50 0.50 0.50 0.50 - - - - - - vpopcntq (%rdi){1to4}, %ymm0 {%k1} {z}

0 commit comments

Comments
 (0)