@@ -253,37 +253,39 @@ define void @fhalf(<vscale x 8 x half> %v) #1{
253
253
; PAIR-NEXT: str p8, [sp, #11, mul vl] // 2-byte Folded Spill
254
254
; PAIR-NEXT: ptrue pn8.b
255
255
; PAIR-NEXT: str p15, [sp, #4, mul vl] // 2-byte Folded Spill
256
- ; PAIR-NEXT: st1b { z22.b, z23.b }, pn8, [sp, #4 , mul vl] // 32-byte Folded Spill
257
- ; PAIR-NEXT: st1b { z20.b, z21.b }, pn8, [sp, #8 , mul vl] // 32-byte Folded Spill
256
+ ; PAIR-NEXT: st1b { z22.b, z23.b }, pn8, [sp, #2 , mul vl] // 32-byte Folded Spill
257
+ ; PAIR-NEXT: st1b { z20.b, z21.b }, pn8, [sp, #4 , mul vl] // 32-byte Folded Spill
258
258
; PAIR-NEXT: str p14, [sp, #5, mul vl] // 2-byte Folded Spill
259
- ; PAIR-NEXT: st1b { z18.b, z19.b }, pn8, [sp, #12 , mul vl] // 32-byte Folded Spill
260
- ; PAIR-NEXT: st1b { z16.b, z17.b }, pn8, [sp, #16 , mul vl] // 32-byte Folded Spill
259
+ ; PAIR-NEXT: st1b { z18.b, z19.b }, pn8, [sp, #6 , mul vl] // 32-byte Folded Spill
260
+ ; PAIR-NEXT: st1b { z16.b, z17.b }, pn8, [sp, #8 , mul vl] // 32-byte Folded Spill
261
261
; PAIR-NEXT: str p13, [sp, #6, mul vl] // 2-byte Folded Spill
262
- ; PAIR-NEXT: st1b { z14.b, z15.b }, pn8, [sp, #20 , mul vl] // 32-byte Folded Spill
263
- ; PAIR-NEXT: st1b { z12.b, z13.b }, pn8, [sp, #24 , mul vl] // 32-byte Folded Spill
262
+ ; PAIR-NEXT: st1b { z14.b, z15.b }, pn8, [sp, #10 , mul vl] // 32-byte Folded Spill
263
+ ; PAIR-NEXT: st1b { z12.b, z13.b }, pn8, [sp, #12 , mul vl] // 32-byte Folded Spill
264
264
; PAIR-NEXT: str p12, [sp, #7, mul vl] // 2-byte Folded Spill
265
- ; PAIR-NEXT: st1b { z10.b, z11.b }, pn8, [sp, #28 , mul vl] // 32-byte Folded Spill
265
+ ; PAIR-NEXT: st1b { z10.b, z11.b }, pn8, [sp, #14 , mul vl] // 32-byte Folded Spill
266
266
; PAIR-NEXT: str p11, [sp, #8, mul vl] // 2-byte Folded Spill
267
267
; PAIR-NEXT: str p10, [sp, #9, mul vl] // 2-byte Folded Spill
268
268
; PAIR-NEXT: str p9, [sp, #10, mul vl] // 2-byte Folded Spill
269
269
; PAIR-NEXT: str p7, [sp, #12, mul vl] // 2-byte Folded Spill
270
270
; PAIR-NEXT: str p6, [sp, #13, mul vl] // 2-byte Folded Spill
271
271
; PAIR-NEXT: str p5, [sp, #14, mul vl] // 2-byte Folded Spill
272
272
; PAIR-NEXT: str p4, [sp, #15, mul vl] // 2-byte Folded Spill
273
- ; PAIR-NEXT: st1b { z8.b, z9.b }, pn8, [sp, #32, mul vl] // 32-byte Folded Spill
273
+ ; PAIR-NEXT: str z9, [sp, #16, mul vl] // 16-byte Folded Spill
274
+ ; PAIR-NEXT: str z8, [sp, #17, mul vl] // 16-byte Folded Spill
274
275
; PAIR-NEXT: smstop sm
275
276
; PAIR-NEXT: bl my_func
276
277
; PAIR-NEXT: smstart sm
277
278
; PAIR-NEXT: ptrue pn8.b
279
+ ; PAIR-NEXT: ldr z9, [sp, #16, mul vl] // 16-byte Folded Reload
280
+ ; PAIR-NEXT: ldr z8, [sp, #17, mul vl] // 16-byte Folded Reload
281
+ ; PAIR-NEXT: ld1b { z22.b, z23.b }, pn8/z, [sp, #2, mul vl] // 32-byte Folded Reload
282
+ ; PAIR-NEXT: ld1b { z20.b, z21.b }, pn8/z, [sp, #4, mul vl] // 32-byte Folded Reload
283
+ ; PAIR-NEXT: ld1b { z18.b, z19.b }, pn8/z, [sp, #6, mul vl] // 32-byte Folded Reload
284
+ ; PAIR-NEXT: ld1b { z16.b, z17.b }, pn8/z, [sp, #8, mul vl] // 32-byte Folded Reload
285
+ ; PAIR-NEXT: ld1b { z14.b, z15.b }, pn8/z, [sp, #10, mul vl] // 32-byte Folded Reload
286
+ ; PAIR-NEXT: ld1b { z12.b, z13.b }, pn8/z, [sp, #12, mul vl] // 32-byte Folded Reload
287
+ ; PAIR-NEXT: ld1b { z10.b, z11.b }, pn8/z, [sp, #14, mul vl] // 32-byte Folded Reload
278
288
; PAIR-NEXT: ldr p15, [sp, #4, mul vl] // 2-byte Folded Reload
279
- ; PAIR-NEXT: ld1b { z22.b, z23.b }, pn8/z, [sp, #4, mul vl] // 32-byte Folded Reload
280
- ; PAIR-NEXT: ld1b { z20.b, z21.b }, pn8/z, [sp, #8, mul vl] // 32-byte Folded Reload
281
- ; PAIR-NEXT: ld1b { z18.b, z19.b }, pn8/z, [sp, #12, mul vl] // 32-byte Folded Reload
282
- ; PAIR-NEXT: ld1b { z16.b, z17.b }, pn8/z, [sp, #16, mul vl] // 32-byte Folded Reload
283
- ; PAIR-NEXT: ld1b { z14.b, z15.b }, pn8/z, [sp, #20, mul vl] // 32-byte Folded Reload
284
- ; PAIR-NEXT: ld1b { z12.b, z13.b }, pn8/z, [sp, #24, mul vl] // 32-byte Folded Reload
285
- ; PAIR-NEXT: ld1b { z10.b, z11.b }, pn8/z, [sp, #28, mul vl] // 32-byte Folded Reload
286
- ; PAIR-NEXT: ld1b { z8.b, z9.b }, pn8/z, [sp, #32, mul vl] // 32-byte Folded Reload
287
289
; PAIR-NEXT: ldr p14, [sp, #5, mul vl] // 2-byte Folded Reload
288
290
; PAIR-NEXT: ldr p13, [sp, #6, mul vl] // 2-byte Folded Reload
289
291
; PAIR-NEXT: ldr p12, [sp, #7, mul vl] // 2-byte Folded Reload
0 commit comments