@@ -11,12 +11,14 @@ declare double @normal_callee(double)
11
11
define double @nonstreaming_caller_streaming_callee (double %x ) nounwind noinline optnone {
12
12
; CHECK-FISEL-LABEL: nonstreaming_caller_streaming_callee:
13
13
; CHECK-FISEL: // %bb.0: // %entry
14
+ ; CHECK-FISEL-NEXT: cntd x9
14
15
; CHECK-FISEL-NEXT: sub sp, sp, #96
15
16
; CHECK-FISEL-NEXT: stp d15, d14, [sp, #16] // 16-byte Folded Spill
16
17
; CHECK-FISEL-NEXT: stp d13, d12, [sp, #32] // 16-byte Folded Spill
17
18
; CHECK-FISEL-NEXT: stp d11, d10, [sp, #48] // 16-byte Folded Spill
18
19
; CHECK-FISEL-NEXT: stp d9, d8, [sp, #64] // 16-byte Folded Spill
19
20
; CHECK-FISEL-NEXT: str x30, [sp, #80] // 8-byte Folded Spill
21
+ ; CHECK-FISEL-NEXT: str x9, [sp, #88] // 8-byte Folded Spill
20
22
; CHECK-FISEL-NEXT: str d0, [sp] // 8-byte Folded Spill
21
23
; CHECK-FISEL-NEXT: smstart sm
22
24
; CHECK-FISEL-NEXT: ldr d0, [sp] // 8-byte Folded Reload
@@ -37,12 +39,14 @@ define double @nonstreaming_caller_streaming_callee(double %x) nounwind noinline
37
39
;
38
40
; CHECK-GISEL-LABEL: nonstreaming_caller_streaming_callee:
39
41
; CHECK-GISEL: // %bb.0: // %entry
42
+ ; CHECK-GISEL-NEXT: cntd x9
40
43
; CHECK-GISEL-NEXT: sub sp, sp, #96
41
44
; CHECK-GISEL-NEXT: stp d15, d14, [sp, #16] // 16-byte Folded Spill
42
45
; CHECK-GISEL-NEXT: stp d13, d12, [sp, #32] // 16-byte Folded Spill
43
46
; CHECK-GISEL-NEXT: stp d11, d10, [sp, #48] // 16-byte Folded Spill
44
47
; CHECK-GISEL-NEXT: stp d9, d8, [sp, #64] // 16-byte Folded Spill
45
48
; CHECK-GISEL-NEXT: str x30, [sp, #80] // 8-byte Folded Spill
49
+ ; CHECK-GISEL-NEXT: str x9, [sp, #88] // 8-byte Folded Spill
46
50
; CHECK-GISEL-NEXT: str d0, [sp] // 8-byte Folded Spill
47
51
; CHECK-GISEL-NEXT: smstart sm
48
52
; CHECK-GISEL-NEXT: ldr d0, [sp] // 8-byte Folded Reload
@@ -70,12 +74,14 @@ entry:
70
74
define double @streaming_caller_nonstreaming_callee (double %x ) nounwind noinline optnone "aarch64_pstate_sm_enabled" {
71
75
; CHECK-COMMON-LABEL: streaming_caller_nonstreaming_callee:
72
76
; CHECK-COMMON: // %bb.0: // %entry
77
+ ; CHECK-COMMON-NEXT: cntd x9
73
78
; CHECK-COMMON-NEXT: sub sp, sp, #96
74
79
; CHECK-COMMON-NEXT: stp d15, d14, [sp, #16] // 16-byte Folded Spill
75
80
; CHECK-COMMON-NEXT: stp d13, d12, [sp, #32] // 16-byte Folded Spill
76
81
; CHECK-COMMON-NEXT: stp d11, d10, [sp, #48] // 16-byte Folded Spill
77
82
; CHECK-COMMON-NEXT: stp d9, d8, [sp, #64] // 16-byte Folded Spill
78
83
; CHECK-COMMON-NEXT: str x30, [sp, #80] // 8-byte Folded Spill
84
+ ; CHECK-COMMON-NEXT: str x9, [sp, #88] // 8-byte Folded Spill
79
85
; CHECK-COMMON-NEXT: str d0, [sp] // 8-byte Folded Spill
80
86
; CHECK-COMMON-NEXT: smstop sm
81
87
; CHECK-COMMON-NEXT: ldr d0, [sp] // 8-byte Folded Reload
@@ -102,12 +108,14 @@ entry:
102
108
define double @locally_streaming_caller_normal_callee (double %x ) nounwind noinline optnone "aarch64_pstate_sm_body" {
103
109
; CHECK-COMMON-LABEL: locally_streaming_caller_normal_callee:
104
110
; CHECK-COMMON: // %bb.0:
111
+ ; CHECK-COMMON-NEXT: cntd x9
105
112
; CHECK-COMMON-NEXT: sub sp, sp, #112
106
113
; CHECK-COMMON-NEXT: stp d15, d14, [sp, #32] // 16-byte Folded Spill
107
114
; CHECK-COMMON-NEXT: stp d13, d12, [sp, #48] // 16-byte Folded Spill
108
115
; CHECK-COMMON-NEXT: stp d11, d10, [sp, #64] // 16-byte Folded Spill
109
116
; CHECK-COMMON-NEXT: stp d9, d8, [sp, #80] // 16-byte Folded Spill
110
117
; CHECK-COMMON-NEXT: str x30, [sp, #96] // 8-byte Folded Spill
118
+ ; CHECK-COMMON-NEXT: str x9, [sp, #104] // 8-byte Folded Spill
111
119
; CHECK-COMMON-NEXT: str d0, [sp, #24] // 8-byte Folded Spill
112
120
; CHECK-COMMON-NEXT: smstart sm
113
121
; CHECK-COMMON-NEXT: ldr d0, [sp, #24] // 8-byte Folded Reload
@@ -166,11 +174,13 @@ define double @normal_caller_to_locally_streaming_callee(double %x) nounwind noi
166
174
define void @locally_streaming_caller_streaming_callee_ptr (ptr %p ) nounwind noinline optnone "aarch64_pstate_sm_body" {
167
175
; CHECK-COMMON-LABEL: locally_streaming_caller_streaming_callee_ptr:
168
176
; CHECK-COMMON: // %bb.0:
177
+ ; CHECK-COMMON-NEXT: cntd x9
169
178
; CHECK-COMMON-NEXT: stp d15, d14, [sp, #-80]! // 16-byte Folded Spill
170
179
; CHECK-COMMON-NEXT: stp d13, d12, [sp, #16] // 16-byte Folded Spill
171
180
; CHECK-COMMON-NEXT: stp d11, d10, [sp, #32] // 16-byte Folded Spill
172
181
; CHECK-COMMON-NEXT: stp d9, d8, [sp, #48] // 16-byte Folded Spill
173
182
; CHECK-COMMON-NEXT: str x30, [sp, #64] // 8-byte Folded Spill
183
+ ; CHECK-COMMON-NEXT: str x9, [sp, #72] // 8-byte Folded Spill
174
184
; CHECK-COMMON-NEXT: smstart sm
175
185
; CHECK-COMMON-NEXT: blr x0
176
186
; CHECK-COMMON-NEXT: smstop sm
@@ -187,11 +197,13 @@ define void @locally_streaming_caller_streaming_callee_ptr(ptr %p) nounwind noin
187
197
define void @normal_call_to_streaming_callee_ptr (ptr %p ) nounwind noinline optnone {
188
198
; CHECK-COMMON-LABEL: normal_call_to_streaming_callee_ptr:
189
199
; CHECK-COMMON: // %bb.0:
200
+ ; CHECK-COMMON-NEXT: cntd x9
190
201
; CHECK-COMMON-NEXT: stp d15, d14, [sp, #-80]! // 16-byte Folded Spill
191
202
; CHECK-COMMON-NEXT: stp d13, d12, [sp, #16] // 16-byte Folded Spill
192
203
; CHECK-COMMON-NEXT: stp d11, d10, [sp, #32] // 16-byte Folded Spill
193
204
; CHECK-COMMON-NEXT: stp d9, d8, [sp, #48] // 16-byte Folded Spill
194
205
; CHECK-COMMON-NEXT: str x30, [sp, #64] // 8-byte Folded Spill
206
+ ; CHECK-COMMON-NEXT: str x9, [sp, #72] // 8-byte Folded Spill
195
207
; CHECK-COMMON-NEXT: smstart sm
196
208
; CHECK-COMMON-NEXT: blr x0
197
209
; CHECK-COMMON-NEXT: smstop sm
@@ -325,12 +337,13 @@ define fp128 @f128_call_za(fp128 %a, fp128 %b) "aarch64_inout_za" nounwind {
325
337
define fp128 @f128_call_sm (fp128 %a , fp128 %b ) "aarch64_pstate_sm_enabled" nounwind {
326
338
; CHECK-COMMON-LABEL: f128_call_sm:
327
339
; CHECK-COMMON: // %bb.0:
340
+ ; CHECK-COMMON-NEXT: cntd x9
328
341
; CHECK-COMMON-NEXT: sub sp, sp, #112
329
342
; CHECK-COMMON-NEXT: stp d15, d14, [sp, #32] // 16-byte Folded Spill
330
343
; CHECK-COMMON-NEXT: stp d13, d12, [sp, #48] // 16-byte Folded Spill
331
344
; CHECK-COMMON-NEXT: stp d11, d10, [sp, #64] // 16-byte Folded Spill
332
345
; CHECK-COMMON-NEXT: stp d9, d8, [sp, #80] // 16-byte Folded Spill
333
- ; CHECK-COMMON-NEXT: str x30, [sp, #96] // 8-byte Folded Spill
346
+ ; CHECK-COMMON-NEXT: stp x30, x9, [sp, #96] // 16-byte Folded Spill
334
347
; CHECK-COMMON-NEXT: stp q1, q0, [sp] // 32-byte Folded Spill
335
348
; CHECK-COMMON-NEXT: smstop sm
336
349
; CHECK-COMMON-NEXT: ldp q1, q0, [sp] // 32-byte Folded Reload
@@ -386,12 +399,13 @@ define double @frem_call_za(double %a, double %b) "aarch64_inout_za" nounwind {
386
399
define float @frem_call_sm (float %a , float %b ) "aarch64_pstate_sm_enabled" nounwind {
387
400
; CHECK-COMMON-LABEL: frem_call_sm:
388
401
; CHECK-COMMON: // %bb.0:
402
+ ; CHECK-COMMON-NEXT: cntd x9
389
403
; CHECK-COMMON-NEXT: sub sp, sp, #96
390
404
; CHECK-COMMON-NEXT: stp d15, d14, [sp, #16] // 16-byte Folded Spill
391
405
; CHECK-COMMON-NEXT: stp d13, d12, [sp, #32] // 16-byte Folded Spill
392
406
; CHECK-COMMON-NEXT: stp d11, d10, [sp, #48] // 16-byte Folded Spill
393
407
; CHECK-COMMON-NEXT: stp d9, d8, [sp, #64] // 16-byte Folded Spill
394
- ; CHECK-COMMON-NEXT: str x30, [sp, #80] // 8-byte Folded Spill
408
+ ; CHECK-COMMON-NEXT: stp x30, x9, [sp, #80] // 16-byte Folded Spill
395
409
; CHECK-COMMON-NEXT: stp s1, s0, [sp, #8] // 8-byte Folded Spill
396
410
; CHECK-COMMON-NEXT: smstop sm
397
411
; CHECK-COMMON-NEXT: ldp s1, s0, [sp, #8] // 8-byte Folded Reload
@@ -414,12 +428,14 @@ define float @frem_call_sm(float %a, float %b) "aarch64_pstate_sm_enabled" nounw
414
428
define float @frem_call_sm_compat (float %a , float %b ) "aarch64_pstate_sm_compatible" nounwind {
415
429
; CHECK-COMMON-LABEL: frem_call_sm_compat:
416
430
; CHECK-COMMON: // %bb.0:
417
- ; CHECK-COMMON-NEXT: sub sp, sp, #96
431
+ ; CHECK-COMMON-NEXT: cntd x9
432
+ ; CHECK-COMMON-NEXT: sub sp, sp, #112
418
433
; CHECK-COMMON-NEXT: stp d15, d14, [sp, #16] // 16-byte Folded Spill
419
434
; CHECK-COMMON-NEXT: stp d13, d12, [sp, #32] // 16-byte Folded Spill
420
435
; CHECK-COMMON-NEXT: stp d11, d10, [sp, #48] // 16-byte Folded Spill
421
436
; CHECK-COMMON-NEXT: stp d9, d8, [sp, #64] // 16-byte Folded Spill
422
- ; CHECK-COMMON-NEXT: stp x30, x19, [sp, #80] // 16-byte Folded Spill
437
+ ; CHECK-COMMON-NEXT: stp x30, x9, [sp, #80] // 16-byte Folded Spill
438
+ ; CHECK-COMMON-NEXT: str x19, [sp, #96] // 8-byte Folded Spill
423
439
; CHECK-COMMON-NEXT: stp s0, s1, [sp, #8] // 8-byte Folded Spill
424
440
; CHECK-COMMON-NEXT: bl __arm_sme_state
425
441
; CHECK-COMMON-NEXT: ldp s2, s0, [sp, #8] // 8-byte Folded Reload
@@ -436,13 +452,14 @@ define float @frem_call_sm_compat(float %a, float %b) "aarch64_pstate_sm_compati
436
452
; CHECK-COMMON-NEXT: // %bb.3:
437
453
; CHECK-COMMON-NEXT: smstart sm
438
454
; CHECK-COMMON-NEXT: .LBB12_4:
439
- ; CHECK-COMMON-NEXT: ldp x30, x19, [sp, #80] // 16-byte Folded Reload
440
- ; CHECK-COMMON-NEXT: ldr s0, [sp, #12] // 4-byte Folded Reload
441
455
; CHECK-COMMON-NEXT: ldp d9, d8, [sp, #64] // 16-byte Folded Reload
456
+ ; CHECK-COMMON-NEXT: ldr s0, [sp, #12] // 4-byte Folded Reload
442
457
; CHECK-COMMON-NEXT: ldp d11, d10, [sp, #48] // 16-byte Folded Reload
458
+ ; CHECK-COMMON-NEXT: ldr x19, [sp, #96] // 8-byte Folded Reload
459
+ ; CHECK-COMMON-NEXT: ldr x30, [sp, #80] // 8-byte Folded Reload
443
460
; CHECK-COMMON-NEXT: ldp d13, d12, [sp, #32] // 16-byte Folded Reload
444
461
; CHECK-COMMON-NEXT: ldp d15, d14, [sp, #16] // 16-byte Folded Reload
445
- ; CHECK-COMMON-NEXT: add sp, sp, #96
462
+ ; CHECK-COMMON-NEXT: add sp, sp, #112
446
463
; CHECK-COMMON-NEXT: ret
447
464
%res = frem float %a , %b
448
465
ret float %res
0 commit comments