@@ -956,8 +956,7 @@ define <2 x i64> @vec128_i64_signed_reg_reg(<2 x i64> %a1, <2 x i64> %a2) nounwi
956
956
; AVX1-FALLBACK: # %bb.0:
957
957
; AVX1-FALLBACK-NEXT: vpcmpgtq %xmm1, %xmm0, %xmm2
958
958
; AVX1-FALLBACK-NEXT: vpor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm3
959
- ; AVX1-FALLBACK-NEXT: vpcmpgtq %xmm0, %xmm1, %xmm4
960
- ; AVX1-FALLBACK-NEXT: vblendvpd %xmm4, %xmm0, %xmm1, %xmm4
959
+ ; AVX1-FALLBACK-NEXT: vblendvpd %xmm2, %xmm1, %xmm0, %xmm4
961
960
; AVX1-FALLBACK-NEXT: vblendvpd %xmm2, %xmm0, %xmm1, %xmm1
962
961
; AVX1-FALLBACK-NEXT: vpsubq %xmm4, %xmm1, %xmm1
963
962
; AVX1-FALLBACK-NEXT: vpsrlq $1, %xmm1, %xmm2
@@ -976,8 +975,7 @@ define <2 x i64> @vec128_i64_signed_reg_reg(<2 x i64> %a1, <2 x i64> %a2) nounwi
976
975
; AVX2-FALLBACK: # %bb.0:
977
976
; AVX2-FALLBACK-NEXT: vpcmpgtq %xmm1, %xmm0, %xmm2
978
977
; AVX2-FALLBACK-NEXT: vpor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm3
979
- ; AVX2-FALLBACK-NEXT: vpcmpgtq %xmm0, %xmm1, %xmm4
980
- ; AVX2-FALLBACK-NEXT: vblendvpd %xmm4, %xmm0, %xmm1, %xmm4
978
+ ; AVX2-FALLBACK-NEXT: vblendvpd %xmm2, %xmm1, %xmm0, %xmm4
981
979
; AVX2-FALLBACK-NEXT: vblendvpd %xmm2, %xmm0, %xmm1, %xmm1
982
980
; AVX2-FALLBACK-NEXT: vpsubq %xmm4, %xmm1, %xmm1
983
981
; AVX2-FALLBACK-NEXT: vpsrlq $1, %xmm1, %xmm2
@@ -1401,8 +1399,7 @@ define <2 x i64> @vec128_i64_signed_mem_reg(ptr %a1_addr, <2 x i64> %a2) nounwin
1401
1399
; AVX1-FALLBACK-NEXT: vmovdqa (%rdi), %xmm1
1402
1400
; AVX1-FALLBACK-NEXT: vpcmpgtq %xmm0, %xmm1, %xmm2
1403
1401
; AVX1-FALLBACK-NEXT: vpor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm3
1404
- ; AVX1-FALLBACK-NEXT: vpcmpgtq %xmm1, %xmm0, %xmm4
1405
- ; AVX1-FALLBACK-NEXT: vblendvpd %xmm4, %xmm1, %xmm0, %xmm4
1402
+ ; AVX1-FALLBACK-NEXT: vblendvpd %xmm2, %xmm0, %xmm1, %xmm4
1406
1403
; AVX1-FALLBACK-NEXT: vblendvpd %xmm2, %xmm1, %xmm0, %xmm0
1407
1404
; AVX1-FALLBACK-NEXT: vpsubq %xmm4, %xmm0, %xmm0
1408
1405
; AVX1-FALLBACK-NEXT: vpsrlq $1, %xmm0, %xmm2
@@ -1422,8 +1419,7 @@ define <2 x i64> @vec128_i64_signed_mem_reg(ptr %a1_addr, <2 x i64> %a2) nounwin
1422
1419
; AVX2-FALLBACK-NEXT: vmovdqa (%rdi), %xmm1
1423
1420
; AVX2-FALLBACK-NEXT: vpcmpgtq %xmm0, %xmm1, %xmm2
1424
1421
; AVX2-FALLBACK-NEXT: vpor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm3
1425
- ; AVX2-FALLBACK-NEXT: vpcmpgtq %xmm1, %xmm0, %xmm4
1426
- ; AVX2-FALLBACK-NEXT: vblendvpd %xmm4, %xmm1, %xmm0, %xmm4
1422
+ ; AVX2-FALLBACK-NEXT: vblendvpd %xmm2, %xmm0, %xmm1, %xmm4
1427
1423
; AVX2-FALLBACK-NEXT: vblendvpd %xmm2, %xmm1, %xmm0, %xmm0
1428
1424
; AVX2-FALLBACK-NEXT: vpsubq %xmm4, %xmm0, %xmm0
1429
1425
; AVX2-FALLBACK-NEXT: vpsrlq $1, %xmm0, %xmm2
@@ -1624,8 +1620,7 @@ define <2 x i64> @vec128_i64_signed_reg_mem(<2 x i64> %a1, ptr %a2_addr) nounwin
1624
1620
; AVX1-FALLBACK-NEXT: vmovdqa (%rdi), %xmm1
1625
1621
; AVX1-FALLBACK-NEXT: vpcmpgtq %xmm1, %xmm0, %xmm2
1626
1622
; AVX1-FALLBACK-NEXT: vpor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm3
1627
- ; AVX1-FALLBACK-NEXT: vpcmpgtq %xmm0, %xmm1, %xmm4
1628
- ; AVX1-FALLBACK-NEXT: vblendvpd %xmm4, %xmm0, %xmm1, %xmm4
1623
+ ; AVX1-FALLBACK-NEXT: vblendvpd %xmm2, %xmm1, %xmm0, %xmm4
1629
1624
; AVX1-FALLBACK-NEXT: vblendvpd %xmm2, %xmm0, %xmm1, %xmm1
1630
1625
; AVX1-FALLBACK-NEXT: vpsubq %xmm4, %xmm1, %xmm1
1631
1626
; AVX1-FALLBACK-NEXT: vpsrlq $1, %xmm1, %xmm2
@@ -1645,8 +1640,7 @@ define <2 x i64> @vec128_i64_signed_reg_mem(<2 x i64> %a1, ptr %a2_addr) nounwin
1645
1640
; AVX2-FALLBACK-NEXT: vmovdqa (%rdi), %xmm1
1646
1641
; AVX2-FALLBACK-NEXT: vpcmpgtq %xmm1, %xmm0, %xmm2
1647
1642
; AVX2-FALLBACK-NEXT: vpor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm3
1648
- ; AVX2-FALLBACK-NEXT: vpcmpgtq %xmm0, %xmm1, %xmm4
1649
- ; AVX2-FALLBACK-NEXT: vblendvpd %xmm4, %xmm0, %xmm1, %xmm4
1643
+ ; AVX2-FALLBACK-NEXT: vblendvpd %xmm2, %xmm1, %xmm0, %xmm4
1650
1644
; AVX2-FALLBACK-NEXT: vblendvpd %xmm2, %xmm0, %xmm1, %xmm1
1651
1645
; AVX2-FALLBACK-NEXT: vpsubq %xmm4, %xmm1, %xmm1
1652
1646
; AVX2-FALLBACK-NEXT: vpsrlq $1, %xmm1, %xmm2
@@ -1850,8 +1844,7 @@ define <2 x i64> @vec128_i64_signed_mem_mem(ptr %a1_addr, ptr %a2_addr) nounwind
1850
1844
; AVX1-FALLBACK-NEXT: vmovdqa (%rsi), %xmm1
1851
1845
; AVX1-FALLBACK-NEXT: vpcmpgtq %xmm1, %xmm0, %xmm2
1852
1846
; AVX1-FALLBACK-NEXT: vpor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm3
1853
- ; AVX1-FALLBACK-NEXT: vpcmpgtq %xmm0, %xmm1, %xmm4
1854
- ; AVX1-FALLBACK-NEXT: vblendvpd %xmm4, %xmm0, %xmm1, %xmm4
1847
+ ; AVX1-FALLBACK-NEXT: vblendvpd %xmm2, %xmm1, %xmm0, %xmm4
1855
1848
; AVX1-FALLBACK-NEXT: vblendvpd %xmm2, %xmm0, %xmm1, %xmm1
1856
1849
; AVX1-FALLBACK-NEXT: vpsubq %xmm4, %xmm1, %xmm1
1857
1850
; AVX1-FALLBACK-NEXT: vpsrlq $1, %xmm1, %xmm2
@@ -1872,8 +1865,7 @@ define <2 x i64> @vec128_i64_signed_mem_mem(ptr %a1_addr, ptr %a2_addr) nounwind
1872
1865
; AVX2-FALLBACK-NEXT: vmovdqa (%rsi), %xmm1
1873
1866
; AVX2-FALLBACK-NEXT: vpcmpgtq %xmm1, %xmm0, %xmm2
1874
1867
; AVX2-FALLBACK-NEXT: vpor {{\.?LCPI[0-9]+_[0-9]+}}(%rip), %xmm2, %xmm3
1875
- ; AVX2-FALLBACK-NEXT: vpcmpgtq %xmm0, %xmm1, %xmm4
1876
- ; AVX2-FALLBACK-NEXT: vblendvpd %xmm4, %xmm0, %xmm1, %xmm4
1868
+ ; AVX2-FALLBACK-NEXT: vblendvpd %xmm2, %xmm1, %xmm0, %xmm4
1877
1869
; AVX2-FALLBACK-NEXT: vblendvpd %xmm2, %xmm0, %xmm1, %xmm1
1878
1870
; AVX2-FALLBACK-NEXT: vpsubq %xmm4, %xmm1, %xmm1
1879
1871
; AVX2-FALLBACK-NEXT: vpsrlq $1, %xmm1, %xmm2
0 commit comments