@@ -495,17 +495,17 @@ define amdgpu_kernel void @usage_direct_recursion(i32 %n) #0 {
495
495
; GCN: NumVgprs: max(43, multi_stage_recurse1.num_vgpr)
496
496
; GCN: ScratchSize: 16+max(multi_stage_recurse1.private_seg_size)
497
497
; GCN-LABEL: {{^}}multi_stage_recurse1:
498
- ; GCN: .set multi_stage_recurse1.num_vgpr, max(48, amdgpu.max_num_vgpr )
499
- ; GCN: .set multi_stage_recurse1.num_agpr, max(0, amdgpu.max_num_agpr )
500
- ; GCN: .set multi_stage_recurse1.numbered_sgpr, max(34, amdgpu.max_num_sgpr )
498
+ ; GCN: .set multi_stage_recurse1.num_vgpr, max(48, 43 )
499
+ ; GCN: .set multi_stage_recurse1.num_agpr, max(0, 0 )
500
+ ; GCN: .set multi_stage_recurse1.numbered_sgpr, max(34, 34 )
501
501
; GCN: .set multi_stage_recurse1.private_seg_size, 16
502
502
; GCN: .set multi_stage_recurse1.uses_vcc, 1
503
503
; GCN: .set multi_stage_recurse1.uses_flat_scratch, 0
504
504
; GCN: .set multi_stage_recurse1.has_dyn_sized_stack, 0
505
505
; GCN: .set multi_stage_recurse1.has_recursion, 1
506
506
; GCN: .set multi_stage_recurse1.has_indirect_call, 0
507
- ; GCN: TotalNumSgprs: multi_stage_recurse1.numbered_sgpr+4
508
- ; GCN: NumVgprs: max(48, amdgpu.max_num_vgpr)
507
+ ; GCN: TotalNumSgprs: 38
508
+ ; GCN: NumVgprs: 48
509
509
; GCN: ScratchSize: 16
510
510
define void @multi_stage_recurse1 (i32 %val ) #2 {
511
511
call void @multi_stage_recurse2 (i32 %val )
@@ -528,8 +528,8 @@ define void @multi_stage_recurse2(i32 %val) #2 {
528
528
; GCN: .set usage_multi_stage_recurse.has_dyn_sized_stack, or(0, multi_stage_recurse1.has_dyn_sized_stack)
529
529
; GCN: .set usage_multi_stage_recurse.has_recursion, or(1, multi_stage_recurse1.has_recursion)
530
530
; GCN: .set usage_multi_stage_recurse.has_indirect_call, or(0, multi_stage_recurse1.has_indirect_call)
531
- ; GCN: TotalNumSgprs: usage_multi_stage_recurse.numbered_sgpr+6
532
- ; GCN: NumVgprs: usage_multi_stage_recurse.num_vgpr
531
+ ; GCN: TotalNumSgprs: 40
532
+ ; GCN: NumVgprs: 48
533
533
; GCN: ScratchSize: 16
534
534
define amdgpu_kernel void @usage_multi_stage_recurse (i32 %n ) #0 {
535
535
call void @multi_stage_recurse1 (i32 %n )
@@ -550,17 +550,17 @@ define amdgpu_kernel void @usage_multi_stage_recurse(i32 %n) #0 {
550
550
; GCN: NumVgprs: max(41, multi_stage_recurse_noattr1.num_vgpr)
551
551
; GCN: ScratchSize: 16+max(multi_stage_recurse_noattr1.private_seg_size)
552
552
; GCN-LABEL: {{^}}multi_stage_recurse_noattr1:
553
- ; GCN: .set multi_stage_recurse_noattr1.num_vgpr, max(41, amdgpu.max_num_vgpr )
554
- ; GCN: .set multi_stage_recurse_noattr1.num_agpr, max(0, amdgpu.max_num_agpr )
555
- ; GCN: .set multi_stage_recurse_noattr1.numbered_sgpr, max(57, amdgpu.max_num_sgpr )
553
+ ; GCN: .set multi_stage_recurse_noattr1.num_vgpr, max(41, 41 )
554
+ ; GCN: .set multi_stage_recurse_noattr1.num_agpr, max(0, 0 )
555
+ ; GCN: .set multi_stage_recurse_noattr1.numbered_sgpr, max(57, 54 )
556
556
; GCN: .set multi_stage_recurse_noattr1.private_seg_size, 16
557
557
; GCN: .set multi_stage_recurse_noattr1.uses_vcc, 1
558
558
; GCN: .set multi_stage_recurse_noattr1.uses_flat_scratch, 0
559
559
; GCN: .set multi_stage_recurse_noattr1.has_dyn_sized_stack, 0
560
560
; GCN: .set multi_stage_recurse_noattr1.has_recursion, 0
561
561
; GCN: .set multi_stage_recurse_noattr1.has_indirect_call, 0
562
- ; GCN: TotalNumSgprs: multi_stage_recurse_noattr1.numbered_sgpr+4
563
- ; GCN: NumVgprs: max(41, amdgpu.max_num_vgpr)
562
+ ; GCN: TotalNumSgprs: 61
563
+ ; GCN: NumVgprs: 41
564
564
; GCN: ScratchSize: 16
565
565
define void @multi_stage_recurse_noattr1 (i32 %val ) #0 {
566
566
call void @multi_stage_recurse_noattr2 (i32 %val )
@@ -583,8 +583,8 @@ define void @multi_stage_recurse_noattr2(i32 %val) #0 {
583
583
; GCN: .set usage_multi_stage_recurse_noattrs.has_dyn_sized_stack, or(0, multi_stage_recurse_noattr1.has_dyn_sized_stack)
584
584
; GCN: .set usage_multi_stage_recurse_noattrs.has_recursion, or(0, multi_stage_recurse_noattr1.has_recursion)
585
585
; GCN: .set usage_multi_stage_recurse_noattrs.has_indirect_call, or(0, multi_stage_recurse_noattr1.has_indirect_call)
586
- ; GCN: TotalNumSgprs: usage_multi_stage_recurse_noattrs.numbered_sgpr+6
587
- ; GCN: NumVgprs: usage_multi_stage_recurse_noattrs.num_vgpr
586
+ ; GCN: TotalNumSgprs: 63
587
+ ; GCN: NumVgprs: 41
588
588
; GCN: ScratchSize: 16
589
589
define amdgpu_kernel void @usage_multi_stage_recurse_noattrs (i32 %n ) #0 {
590
590
call void @multi_stage_recurse_noattr1 (i32 %n )
@@ -601,8 +601,8 @@ define amdgpu_kernel void @usage_multi_stage_recurse_noattrs(i32 %n) #0 {
601
601
; GCN: .set multi_call_with_multi_stage_recurse.has_dyn_sized_stack, or(0, use_stack0.has_dyn_sized_stack, use_stack1.has_dyn_sized_stack, multi_stage_recurse1.has_dyn_sized_stack)
602
602
; GCN: .set multi_call_with_multi_stage_recurse.has_recursion, or(1, use_stack0.has_recursion, use_stack1.has_recursion, multi_stage_recurse1.has_recursion)
603
603
; GCN: .set multi_call_with_multi_stage_recurse.has_indirect_call, or(0, use_stack0.has_indirect_call, use_stack1.has_indirect_call, multi_stage_recurse1.has_indirect_call)
604
- ; GCN: TotalNumSgprs: multi_call_with_multi_stage_recurse.numbered_sgpr+6
605
- ; GCN: NumVgprs: multi_call_with_multi_stage_recurse.num_vgpr
604
+ ; GCN: TotalNumSgprs: 59
605
+ ; GCN: NumVgprs: 48
606
606
; GCN: ScratchSize: 2052
607
607
define amdgpu_kernel void @multi_call_with_multi_stage_recurse (i32 %n ) #0 {
608
608
call void @use_stack0 ()
0 commit comments