@@ -1498,55 +1498,66 @@ define <vscale x 16 x double> @vp_ceil_vv_nxv16f64(<vscale x 16 x double> %va, <
1498
1498
; CHECK-NEXT: addi sp, sp, -16
1499
1499
; CHECK-NEXT: .cfi_def_cfa_offset 16
1500
1500
; CHECK-NEXT: csrr a1, vlenb
1501
- ; CHECK-NEXT: slli a1, a1, 3
1501
+ ; CHECK-NEXT: slli a1, a1, 4
1502
1502
; CHECK-NEXT: sub sp, sp, a1
1503
- ; CHECK-NEXT: .cfi_escape 0x0f, 0x0d, 0x72, 0x00, 0x11, 0x10, 0x22, 0x11, 0x08 , 0x92, 0xa2, 0x38, 0x00, 0x1e, 0x22 # sp + 16 + 8 * vlenb
1503
+ ; CHECK-NEXT: .cfi_escape 0x0f, 0x0d, 0x72, 0x00, 0x11, 0x10, 0x22, 0x11, 0x10 , 0x92, 0xa2, 0x38, 0x00, 0x1e, 0x22 # sp + 16 + 16 * vlenb
1504
1504
; CHECK-NEXT: vsetvli a1, zero, e8, mf4, ta, ma
1505
- ; CHECK-NEXT: vmv1r.v v7, v0
1505
+ ; CHECK-NEXT: vmv1r.v v24, v0
1506
+ ; CHECK-NEXT: addi a1, sp, 16
1507
+ ; CHECK-NEXT: vs8r.v v8, (a1) # Unknown-size Folded Spill
1506
1508
; CHECK-NEXT: csrr a1, vlenb
1507
1509
; CHECK-NEXT: lui a2, %hi(.LCPI44_0)
1508
1510
; CHECK-NEXT: srli a3, a1, 3
1509
1511
; CHECK-NEXT: fld fa5, %lo(.LCPI44_0)(a2)
1510
1512
; CHECK-NEXT: sub a2, a0, a1
1511
- ; CHECK-NEXT: vslidedown.vx v6 , v0, a3
1513
+ ; CHECK-NEXT: vslidedown.vx v25 , v0, a3
1512
1514
; CHECK-NEXT: sltu a3, a0, a2
1513
1515
; CHECK-NEXT: addi a3, a3, -1
1514
1516
; CHECK-NEXT: and a2, a3, a2
1515
- ; CHECK-NEXT: vmv1r.v v0, v6
1517
+ ; CHECK-NEXT: vmv1r.v v0, v25
1516
1518
; CHECK-NEXT: vsetvli zero, a2, e64, m8, ta, ma
1517
- ; CHECK-NEXT: vfabs.v v24, v16, v0.t
1518
- ; CHECK-NEXT: addi a2, sp, 16
1519
- ; CHECK-NEXT: vs8r.v v24, (a2) # Unknown-size Folded Spill
1520
- ; CHECK-NEXT: vl8r.v v24, (a2) # Unknown-size Folded Reload
1519
+ ; CHECK-NEXT: vfabs.v v8, v16, v0.t
1521
1520
; CHECK-NEXT: vsetvli zero, zero, e64, m8, ta, mu
1522
- ; CHECK-NEXT: vmflt.vf v6, v24 , fa5, v0.t
1521
+ ; CHECK-NEXT: vmflt.vf v25, v8 , fa5, v0.t
1523
1522
; CHECK-NEXT: fsrmi a2, 3
1524
- ; CHECK-NEXT: vmv1r.v v0, v6
1523
+ ; CHECK-NEXT: vmv1r.v v0, v25
1525
1524
; CHECK-NEXT: vsetvli zero, zero, e64, m8, ta, ma
1526
- ; CHECK-NEXT: vfcvt.x.f.v v24 , v16, v0.t
1525
+ ; CHECK-NEXT: vfcvt.x.f.v v8 , v16, v0.t
1527
1526
; CHECK-NEXT: fsrm a2
1528
- ; CHECK-NEXT: vfcvt.f.x.v v24, v24 , v0.t
1527
+ ; CHECK-NEXT: vfcvt.f.x.v v8, v8 , v0.t
1529
1528
; CHECK-NEXT: vsetvli zero, zero, e64, m8, ta, mu
1530
- ; CHECK-NEXT: vfsgnj.vv v16, v24, v16, v0.t
1529
+ ; CHECK-NEXT: vfsgnj.vv v16, v8, v16, v0.t
1530
+ ; CHECK-NEXT: csrr a2, vlenb
1531
+ ; CHECK-NEXT: slli a2, a2, 3
1532
+ ; CHECK-NEXT: add a2, sp, a2
1533
+ ; CHECK-NEXT: addi a2, a2, 16
1534
+ ; CHECK-NEXT: vs8r.v v16, (a2) # Unknown-size Folded Spill
1531
1535
; CHECK-NEXT: bltu a0, a1, .LBB44_2
1532
1536
; CHECK-NEXT: # %bb.1:
1533
1537
; CHECK-NEXT: mv a0, a1
1534
1538
; CHECK-NEXT: .LBB44_2:
1535
- ; CHECK-NEXT: vmv1r.v v0, v7
1539
+ ; CHECK-NEXT: vmv1r.v v0, v24
1540
+ ; CHECK-NEXT: addi a1, sp, 16
1541
+ ; CHECK-NEXT: vl8r.v v8, (a1) # Unknown-size Folded Reload
1536
1542
; CHECK-NEXT: vsetvli zero, a0, e64, m8, ta, ma
1537
- ; CHECK-NEXT: vfabs.v v24 , v8, v0.t
1543
+ ; CHECK-NEXT: vfabs.v v16 , v8, v0.t
1538
1544
; CHECK-NEXT: vsetvli zero, zero, e64, m8, ta, mu
1539
- ; CHECK-NEXT: vmflt.vf v7, v24 , fa5, v0.t
1545
+ ; CHECK-NEXT: vmflt.vf v24, v16 , fa5, v0.t
1540
1546
; CHECK-NEXT: fsrmi a0, 3
1541
- ; CHECK-NEXT: vmv1r.v v0, v7
1547
+ ; CHECK-NEXT: vmv1r.v v0, v24
1542
1548
; CHECK-NEXT: vsetvli zero, zero, e64, m8, ta, ma
1543
- ; CHECK-NEXT: vfcvt.x.f.v v24 , v8, v0.t
1549
+ ; CHECK-NEXT: vfcvt.x.f.v v16 , v8, v0.t
1544
1550
; CHECK-NEXT: fsrm a0
1545
- ; CHECK-NEXT: vfcvt.f.x.v v24, v24 , v0.t
1551
+ ; CHECK-NEXT: vfcvt.f.x.v v16, v16 , v0.t
1546
1552
; CHECK-NEXT: vsetvli zero, zero, e64, m8, ta, mu
1547
- ; CHECK-NEXT: vfsgnj.vv v8, v24 , v8, v0.t
1553
+ ; CHECK-NEXT: vfsgnj.vv v8, v16 , v8, v0.t
1548
1554
; CHECK-NEXT: csrr a0, vlenb
1549
1555
; CHECK-NEXT: slli a0, a0, 3
1556
+ ; CHECK-NEXT: add a0, sp, a0
1557
+ ; CHECK-NEXT: addi a0, a0, 16
1558
+ ; CHECK-NEXT: vl8r.v v16, (a0) # Unknown-size Folded Reload
1559
+ ; CHECK-NEXT: csrr a0, vlenb
1560
+ ; CHECK-NEXT: slli a0, a0, 4
1550
1561
; CHECK-NEXT: add sp, sp, a0
1551
1562
; CHECK-NEXT: .cfi_def_cfa sp, 16
1552
1563
; CHECK-NEXT: addi sp, sp, 16
0 commit comments