@@ -246,19 +246,19 @@ define i32 @PR43159(ptr %a0) {
246
246
; AVX2-LABEL: PR43159:
247
247
; AVX2: # %bb.0: # %entry
248
248
; AVX2-NEXT: vmovdqa (%rdi), %xmm0
249
- ; AVX2-NEXT: vpsrlvd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm1
250
- ; AVX2-NEXT: vpshufd {{.*#+}} xmm2 = xmm1[1,1,3,3]
251
- ; AVX2-NEXT: vpmuludq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm2
249
+ ; AVX2-NEXT: vpshufd {{.*#+}} xmm1 = xmm0[1,1,3,3]
252
250
; AVX2-NEXT: vpmuludq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm1, %xmm1
253
- ; AVX2-NEXT: vpshufd {{.*#+}} xmm1 = xmm1[1,1,3,3]
254
- ; AVX2-NEXT: vpblendd {{.*#+}} xmm1 = xmm1[0],xmm2[1],xmm1[2],xmm2[3]
255
- ; AVX2-NEXT: vpsubd %xmm2, %xmm0, %xmm0
251
+ ; AVX2-NEXT: vpsrlvd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm2
252
+ ; AVX2-NEXT: vpmuludq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm2
253
+ ; AVX2-NEXT: vpshufd {{.*#+}} xmm2 = xmm2[1,1,3,3]
254
+ ; AVX2-NEXT: vpblendd {{.*#+}} xmm2 = xmm2[0],xmm1[1],xmm2[2],xmm1[3]
255
+ ; AVX2-NEXT: vpsubd %xmm1, %xmm0, %xmm0
256
256
; AVX2-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[1,1,3,3]
257
- ; AVX2-NEXT: vpbroadcastd {{.*#+}} xmm2 = [2147483648,2147483648,2147483648,2147483648]
258
- ; AVX2-NEXT: vpmuludq %xmm2 , %xmm0, %xmm0
259
- ; AVX2-NEXT: vpxor %xmm2 , %xmm2 , %xmm2
260
- ; AVX2-NEXT: vpblendd {{.*#+}} xmm0 = xmm2 [0],xmm0[1],xmm2 [2],xmm0[3]
261
- ; AVX2-NEXT: vpaddd %xmm1 , %xmm0, %xmm0
257
+ ; AVX2-NEXT: vpbroadcastd {{.*#+}} xmm1 = [2147483648,2147483648,2147483648,2147483648]
258
+ ; AVX2-NEXT: vpmuludq %xmm1 , %xmm0, %xmm0
259
+ ; AVX2-NEXT: vpxor %xmm1 , %xmm1 , %xmm1
260
+ ; AVX2-NEXT: vpblendd {{.*#+}} xmm0 = xmm1 [0],xmm0[1],xmm1 [2],xmm0[3]
261
+ ; AVX2-NEXT: vpaddd %xmm2 , %xmm0, %xmm0
262
262
; AVX2-NEXT: vpsrlvd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
263
263
; AVX2-NEXT: vmovd %xmm0, %edi
264
264
; AVX2-NEXT: vpextrd $1, %xmm0, %esi
@@ -269,19 +269,19 @@ define i32 @PR43159(ptr %a0) {
269
269
; AVX512VL-LABEL: PR43159:
270
270
; AVX512VL: # %bb.0: # %entry
271
271
; AVX512VL-NEXT: vmovdqa (%rdi), %xmm0
272
- ; AVX512VL-NEXT: vpsrlvd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm1
273
- ; AVX512VL-NEXT: vpshufd {{.*#+}} xmm2 = xmm1[1,1,3,3]
274
- ; AVX512VL-NEXT: vpmuludq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm2
272
+ ; AVX512VL-NEXT: vpshufd {{.*#+}} xmm1 = xmm0[1,1,3,3]
275
273
; AVX512VL-NEXT: vpmuludq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm1, %xmm1
276
- ; AVX512VL-NEXT: vpshufd {{.*#+}} xmm1 = xmm1[1,1,3,3]
277
- ; AVX512VL-NEXT: vpblendd {{.*#+}} xmm1 = xmm1[0],xmm2[1],xmm1[2],xmm2[3]
278
- ; AVX512VL-NEXT: vpsubd %xmm2, %xmm0, %xmm0
274
+ ; AVX512VL-NEXT: vpsrlvd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm2
275
+ ; AVX512VL-NEXT: vpmuludq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm2
276
+ ; AVX512VL-NEXT: vpshufd {{.*#+}} xmm2 = xmm2[1,1,3,3]
277
+ ; AVX512VL-NEXT: vpblendd {{.*#+}} xmm2 = xmm2[0],xmm1[1],xmm2[2],xmm1[3]
278
+ ; AVX512VL-NEXT: vpsubd %xmm1, %xmm0, %xmm0
279
279
; AVX512VL-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[1,1,3,3]
280
- ; AVX512VL-NEXT: vpbroadcastd {{.*#+}} xmm2 = [2147483648,2147483648,2147483648,2147483648]
281
- ; AVX512VL-NEXT: vpmuludq %xmm2 , %xmm0, %xmm0
282
- ; AVX512VL-NEXT: vpxor %xmm2 , %xmm2 , %xmm2
283
- ; AVX512VL-NEXT: vpblendd {{.*#+}} xmm0 = xmm2 [0],xmm0[1],xmm2 [2],xmm0[3]
284
- ; AVX512VL-NEXT: vpaddd %xmm1 , %xmm0, %xmm0
280
+ ; AVX512VL-NEXT: vpbroadcastd {{.*#+}} xmm1 = [2147483648,2147483648,2147483648,2147483648]
281
+ ; AVX512VL-NEXT: vpmuludq %xmm1 , %xmm0, %xmm0
282
+ ; AVX512VL-NEXT: vpxor %xmm1 , %xmm1 , %xmm1
283
+ ; AVX512VL-NEXT: vpblendd {{.*#+}} xmm0 = xmm1 [0],xmm0[1],xmm1 [2],xmm0[3]
284
+ ; AVX512VL-NEXT: vpaddd %xmm2 , %xmm0, %xmm0
285
285
; AVX512VL-NEXT: vpsrlvd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
286
286
; AVX512VL-NEXT: vmovd %xmm0, %edi
287
287
; AVX512VL-NEXT: vpextrd $1, %xmm0, %esi
@@ -292,19 +292,19 @@ define i32 @PR43159(ptr %a0) {
292
292
; AVX512DQVL-LABEL: PR43159:
293
293
; AVX512DQVL: # %bb.0: # %entry
294
294
; AVX512DQVL-NEXT: vmovdqa (%rdi), %xmm0
295
- ; AVX512DQVL-NEXT: vpsrlvd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm1
296
- ; AVX512DQVL-NEXT: vpshufd {{.*#+}} xmm2 = xmm1[1,1,3,3]
297
- ; AVX512DQVL-NEXT: vpmuludq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm2
295
+ ; AVX512DQVL-NEXT: vpshufd {{.*#+}} xmm1 = xmm0[1,1,3,3]
298
296
; AVX512DQVL-NEXT: vpmuludq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm1, %xmm1
299
- ; AVX512DQVL-NEXT: vpshufd {{.*#+}} xmm1 = xmm1[1,1,3,3]
300
- ; AVX512DQVL-NEXT: vpblendd {{.*#+}} xmm1 = xmm1[0],xmm2[1],xmm1[2],xmm2[3]
301
- ; AVX512DQVL-NEXT: vpsubd %xmm2, %xmm0, %xmm0
297
+ ; AVX512DQVL-NEXT: vpsrlvd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm2
298
+ ; AVX512DQVL-NEXT: vpmuludq {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm2
299
+ ; AVX512DQVL-NEXT: vpshufd {{.*#+}} xmm2 = xmm2[1,1,3,3]
300
+ ; AVX512DQVL-NEXT: vpblendd {{.*#+}} xmm2 = xmm2[0],xmm1[1],xmm2[2],xmm1[3]
301
+ ; AVX512DQVL-NEXT: vpsubd %xmm1, %xmm0, %xmm0
302
302
; AVX512DQVL-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[1,1,3,3]
303
- ; AVX512DQVL-NEXT: vpbroadcastd {{.*#+}} xmm2 = [2147483648,2147483648,2147483648,2147483648]
304
- ; AVX512DQVL-NEXT: vpmuludq %xmm2 , %xmm0, %xmm0
305
- ; AVX512DQVL-NEXT: vpxor %xmm2 , %xmm2 , %xmm2
306
- ; AVX512DQVL-NEXT: vpblendd {{.*#+}} xmm0 = xmm2 [0],xmm0[1],xmm2 [2],xmm0[3]
307
- ; AVX512DQVL-NEXT: vpaddd %xmm1 , %xmm0, %xmm0
303
+ ; AVX512DQVL-NEXT: vpbroadcastd {{.*#+}} xmm1 = [2147483648,2147483648,2147483648,2147483648]
304
+ ; AVX512DQVL-NEXT: vpmuludq %xmm1 , %xmm0, %xmm0
305
+ ; AVX512DQVL-NEXT: vpxor %xmm1 , %xmm1 , %xmm1
306
+ ; AVX512DQVL-NEXT: vpblendd {{.*#+}} xmm0 = xmm1 [0],xmm0[1],xmm1 [2],xmm0[3]
307
+ ; AVX512DQVL-NEXT: vpaddd %xmm2 , %xmm0, %xmm0
308
308
; AVX512DQVL-NEXT: vpsrlvd {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm0, %xmm0
309
309
; AVX512DQVL-NEXT: vmovd %xmm0, %edi
310
310
; AVX512DQVL-NEXT: vpextrd $1, %xmm0, %esi
0 commit comments