@@ -1553,50 +1553,48 @@ define amdgpu_kernel void @ctpop_i16_in_br(ptr addrspace(1) %out, ptr addrspace(
1553
1553
; EG: ; %bb.0: ; %entry
1554
1554
; EG-NEXT: ALU 0, @20, KC0[], KC1[]
1555
1555
; EG-NEXT: TEX 0 @14
1556
- ; EG-NEXT: ALU_PUSH_BEFORE 6 , @21, KC0[], KC1[]
1556
+ ; EG-NEXT: ALU_PUSH_BEFORE 4 , @21, KC0[], KC1[]
1557
1557
; EG-NEXT: JUMP @7 POP:1
1558
- ; EG-NEXT: ALU 0, @28 , KC0[CB0:0-32], KC1[]
1558
+ ; EG-NEXT: ALU 0, @26 , KC0[CB0:0-32], KC1[]
1559
1559
; EG-NEXT: TEX 0 @16
1560
- ; EG-NEXT: ALU_POP_AFTER 1, @29 , KC0[], KC1[]
1561
- ; EG-NEXT: ALU_PUSH_BEFORE 2, @31 , KC0[CB0:0-32], KC1[]
1560
+ ; EG-NEXT: ALU_POP_AFTER 1, @27 , KC0[], KC1[]
1561
+ ; EG-NEXT: ALU_PUSH_BEFORE 2, @29 , KC0[CB0:0-32], KC1[]
1562
1562
; EG-NEXT: JUMP @11 POP:1
1563
1563
; EG-NEXT: TEX 0 @18
1564
- ; EG-NEXT: ALU_POP_AFTER 0, @34 , KC0[], KC1[]
1565
- ; EG-NEXT: ALU 11, @35 , KC0[], KC1[]
1564
+ ; EG-NEXT: ALU_POP_AFTER 0, @32 , KC0[], KC1[]
1565
+ ; EG-NEXT: ALU 11, @33 , KC0[], KC1[]
1566
1566
; EG-NEXT: MEM_RAT MSKOR T1.XW, T0.X
1567
1567
; EG-NEXT: CF_END
1568
1568
; EG-NEXT: Fetch clause starting at 14:
1569
- ; EG-NEXT: VTX_READ_16 T1 .X, T0 .X, 46, #3
1569
+ ; EG-NEXT: VTX_READ_16 T2 .X, T1 .X, 46, #3
1570
1570
; EG-NEXT: Fetch clause starting at 16:
1571
- ; EG-NEXT: VTX_READ_16 T1 .X, T1 .X, 2, #1
1571
+ ; EG-NEXT: VTX_READ_16 T0 .X, T0 .X, 2, #1
1572
1572
; EG-NEXT: Fetch clause starting at 18:
1573
- ; EG-NEXT: VTX_READ_16 T0.X, T0 .X, 44, #3
1573
+ ; EG-NEXT: VTX_READ_16 T0.X, T1 .X, 44, #3
1574
1574
; EG-NEXT: ALU clause starting at 20:
1575
- ; EG-NEXT: MOV * T0 .X, 0.0,
1575
+ ; EG-NEXT: MOV * T1 .X, 0.0,
1576
1576
; EG-NEXT: ALU clause starting at 21:
1577
- ; EG-NEXT: AND_INT * T0.W, T1.X, literal.x,
1578
- ; EG-NEXT: 65535(9.183409e-41), 0(0.000000e+00)
1579
- ; EG-NEXT: MOV T1.X, literal.x,
1577
+ ; EG-NEXT: MOV T0.X, literal.x,
1580
1578
; EG-NEXT: MOV T1.W, literal.y,
1581
- ; EG-NEXT: SETNE_INT * T0.W, PV.W , 0.0,
1579
+ ; EG-NEXT: SETNE_INT * T0.W, T2.X , 0.0,
1582
1580
; EG-NEXT: 0(0.000000e+00), 1(1.401298e-45)
1583
1581
; EG-NEXT: PRED_SETNE_INT * ExecMask,PredicateBit (MASKED), PS, 0.0,
1584
- ; EG-NEXT: ALU clause starting at 28 :
1585
- ; EG-NEXT: MOV * T1 .X, KC0[2].Z,
1586
- ; EG-NEXT: ALU clause starting at 29 :
1582
+ ; EG-NEXT: ALU clause starting at 26 :
1583
+ ; EG-NEXT: MOV * T0 .X, KC0[2].Z,
1584
+ ; EG-NEXT: ALU clause starting at 27 :
1587
1585
; EG-NEXT: MOV * T1.W, literal.x,
1588
1586
; EG-NEXT: 0(0.000000e+00), 0(0.000000e+00)
1589
- ; EG-NEXT: ALU clause starting at 31 :
1587
+ ; EG-NEXT: ALU clause starting at 29 :
1590
1588
; EG-NEXT: MOV T0.W, KC0[2].Y,
1591
1589
; EG-NEXT: SETE_INT * T1.W, T1.W, 0.0,
1592
1590
; EG-NEXT: PRED_SETE_INT * ExecMask,PredicateBit (MASKED), PS, 0.0,
1593
- ; EG-NEXT: ALU clause starting at 34 :
1594
- ; EG-NEXT: BCNT_INT * T1 .X, T0.X,
1595
- ; EG-NEXT: ALU clause starting at 35 :
1591
+ ; EG-NEXT: ALU clause starting at 32 :
1592
+ ; EG-NEXT: BCNT_INT * T0 .X, T0.X,
1593
+ ; EG-NEXT: ALU clause starting at 33 :
1596
1594
; EG-NEXT: LSHL * T1.W, T0.W, literal.x,
1597
1595
; EG-NEXT: 3(4.203895e-45), 0(0.000000e+00)
1598
1596
; EG-NEXT: AND_INT T1.W, PV.W, literal.x,
1599
- ; EG-NEXT: AND_INT * T2.W, T1 .X, literal.y,
1597
+ ; EG-NEXT: AND_INT * T2.W, T0 .X, literal.y,
1600
1598
; EG-NEXT: 24(3.363116e-44), 65535(9.183409e-41)
1601
1599
; EG-NEXT: LSHL T1.X, PS, PV.W,
1602
1600
; EG-NEXT: LSHL * T1.W, literal.x, PV.W,
0 commit comments