@@ -2591,24 +2591,24 @@ define amdgpu_kernel void @test_mfma_scale_f32_32x32x64_f8f6f4_0_0__vgprcd_nonma
2591
2591
; SDAG-NEXT: v_mov_b32_e32 v14, s26
2592
2592
; SDAG-NEXT: v_mov_b32_e32 v15, s27
2593
2593
; SDAG-NEXT: s_waitcnt lgkmcnt(0)
2594
- ; SDAG-NEXT: v_accvgpr_write_b32 a0, s8
2595
- ; SDAG-NEXT: v_accvgpr_write_b32 a1, s9
2596
- ; SDAG-NEXT: v_accvgpr_write_b32 a2, s10
2597
- ; SDAG-NEXT: v_accvgpr_write_b32 a3, s11
2598
- ; SDAG-NEXT: v_accvgpr_write_b32 a4, s12
2599
- ; SDAG-NEXT: v_accvgpr_write_b32 a5, s13
2600
- ; SDAG-NEXT: v_accvgpr_write_b32 a6, s14
2601
- ; SDAG-NEXT: v_accvgpr_write_b32 a7, s15
2602
- ; SDAG-NEXT: v_accvgpr_write_b32 a8, s16
2603
- ; SDAG-NEXT: v_accvgpr_write_b32 a9, s17
2604
- ; SDAG-NEXT: v_accvgpr_write_b32 a10, s18
2605
- ; SDAG-NEXT: v_accvgpr_write_b32 a11, s19
2606
- ; SDAG-NEXT: v_accvgpr_write_b32 a12, s20
2607
- ; SDAG-NEXT: v_accvgpr_write_b32 a13, s21
2608
- ; SDAG-NEXT: v_accvgpr_write_b32 a14, s22
2609
- ; SDAG-NEXT: v_accvgpr_write_b32 a15, s23
2594
+ ; SDAG-NEXT: v_accvgpr_write_b32 a31, s23
2595
+ ; SDAG-NEXT: v_accvgpr_write_b32 a30, s22
2596
+ ; SDAG-NEXT: v_accvgpr_write_b32 a29, s21
2597
+ ; SDAG-NEXT: v_accvgpr_write_b32 a28, s20
2598
+ ; SDAG-NEXT: v_accvgpr_write_b32 a27, s19
2599
+ ; SDAG-NEXT: v_accvgpr_write_b32 a26, s18
2600
+ ; SDAG-NEXT: v_accvgpr_write_b32 a25, s17
2601
+ ; SDAG-NEXT: v_accvgpr_write_b32 a24, s16
2602
+ ; SDAG-NEXT: v_accvgpr_write_b32 a23, s15
2603
+ ; SDAG-NEXT: v_accvgpr_write_b32 a22, s14
2604
+ ; SDAG-NEXT: v_accvgpr_write_b32 a21, s13
2605
+ ; SDAG-NEXT: v_accvgpr_write_b32 a20, s12
2606
+ ; SDAG-NEXT: v_accvgpr_write_b32 a19, s11
2607
+ ; SDAG-NEXT: v_accvgpr_write_b32 a18, s10
2608
+ ; SDAG-NEXT: v_accvgpr_write_b32 a17, s9
2609
+ ; SDAG-NEXT: v_accvgpr_write_b32 a16, s8
2610
2610
; SDAG-NEXT: s_nop 1
2611
- ; SDAG-NEXT: v_mfma_scale_f32_32x32x64_f8f6f4 a[0:15], v[0:7], v[8:15], a[0:15], 0, 0 op_sel_hi:[0,0,0 ] cbsz:1 abid:2 blgp:3
2611
+ ; SDAG-NEXT: v_mfma_f32_32x32x64_f8f6f4 a[0:15], v[0:7], v[8:15], a[16:31 ] cbsz:1 abid:2 blgp:3
2612
2612
; SDAG-NEXT: v_mov_b32_e32 v0, s20
2613
2613
; SDAG-NEXT: v_mov_b32_e32 v1, s21
2614
2614
; SDAG-NEXT: v_mov_b32_e32 v2, s22
@@ -2655,31 +2655,31 @@ define amdgpu_kernel void @test_mfma_scale_f32_32x32x64_f8f6f4_0_0__vgprcd_nonma
2655
2655
; GISEL-NEXT: s_waitcnt lgkmcnt(0)
2656
2656
; GISEL-NEXT: v_mov_b64_e32 v[0:1], s[36:37]
2657
2657
; GISEL-NEXT: v_mov_b64_e32 v[8:9], s[44:45]
2658
- ; GISEL-NEXT: v_accvgpr_write_b32 a0, s8
2658
+ ; GISEL-NEXT: v_accvgpr_write_b32 a31, s23
2659
2659
; GISEL-NEXT: v_mov_b64_e32 v[2:3], s[38:39]
2660
2660
; GISEL-NEXT: v_mov_b64_e32 v[4:5], s[40:41]
2661
2661
; GISEL-NEXT: v_mov_b64_e32 v[6:7], s[42:43]
2662
2662
; GISEL-NEXT: v_mov_b64_e32 v[10:11], s[46:47]
2663
2663
; GISEL-NEXT: v_mov_b64_e32 v[12:13], s[48:49]
2664
2664
; GISEL-NEXT: v_mov_b64_e32 v[14:15], s[50:51]
2665
- ; GISEL-NEXT: v_accvgpr_write_b32 a1, s9
2666
- ; GISEL-NEXT: v_accvgpr_write_b32 a2, s10
2667
- ; GISEL-NEXT: v_accvgpr_write_b32 a3, s11
2668
- ; GISEL-NEXT: v_accvgpr_write_b32 a4, s12
2669
- ; GISEL-NEXT: v_accvgpr_write_b32 a5, s13
2670
- ; GISEL-NEXT: v_accvgpr_write_b32 a6, s14
2671
- ; GISEL-NEXT: v_accvgpr_write_b32 a7, s15
2672
- ; GISEL-NEXT: v_accvgpr_write_b32 a8, s16
2673
- ; GISEL-NEXT: v_accvgpr_write_b32 a9, s17
2674
- ; GISEL-NEXT: v_accvgpr_write_b32 a10, s18
2675
- ; GISEL-NEXT: v_accvgpr_write_b32 a11, s19
2676
- ; GISEL-NEXT: v_accvgpr_write_b32 a12, s20
2677
- ; GISEL-NEXT: v_accvgpr_write_b32 a13, s21
2678
- ; GISEL-NEXT: v_accvgpr_write_b32 a14, s22
2679
- ; GISEL-NEXT: v_accvgpr_write_b32 a15, s23
2665
+ ; GISEL-NEXT: v_accvgpr_write_b32 a30, s22
2666
+ ; GISEL-NEXT: v_accvgpr_write_b32 a29, s21
2667
+ ; GISEL-NEXT: v_accvgpr_write_b32 a28, s20
2668
+ ; GISEL-NEXT: v_accvgpr_write_b32 a27, s19
2669
+ ; GISEL-NEXT: v_accvgpr_write_b32 a26, s18
2670
+ ; GISEL-NEXT: v_accvgpr_write_b32 a25, s17
2671
+ ; GISEL-NEXT: v_accvgpr_write_b32 a24, s16
2672
+ ; GISEL-NEXT: v_accvgpr_write_b32 a23, s15
2673
+ ; GISEL-NEXT: v_accvgpr_write_b32 a22, s14
2674
+ ; GISEL-NEXT: v_accvgpr_write_b32 a21, s13
2675
+ ; GISEL-NEXT: v_accvgpr_write_b32 a20, s12
2676
+ ; GISEL-NEXT: v_accvgpr_write_b32 a19, s11
2677
+ ; GISEL-NEXT: v_accvgpr_write_b32 a18, s10
2678
+ ; GISEL-NEXT: v_accvgpr_write_b32 a17, s9
2679
+ ; GISEL-NEXT: v_accvgpr_write_b32 a16, s8
2680
2680
; GISEL-NEXT: v_mov_b64_e32 v[18:19], s[10:11]
2681
2681
; GISEL-NEXT: v_mov_b64_e32 v[16:17], s[8:9]
2682
- ; GISEL-NEXT: v_mfma_scale_f32_32x32x64_f8f6f4 a[0:15], v[0:7], v[8:15], a[0:15], 0, 0 op_sel_hi:[0,0,0 ] cbsz:1 abid:2 blgp:3
2682
+ ; GISEL-NEXT: v_mfma_f32_32x32x64_f8f6f4 a[0:15], v[0:7], v[8:15], a[16:31 ] cbsz:1 abid:2 blgp:3
2683
2683
; GISEL-NEXT: v_mov_b64_e32 v[0:1], s[12:13]
2684
2684
; GISEL-NEXT: v_mov_b64_e32 v[4:5], 0
2685
2685
; GISEL-NEXT: v_mov_b64_e32 v[2:3], s[14:15]
@@ -2887,7 +2887,7 @@ define <16 x float> @test_mfma_scale_f32_32x32x64_f8f6f4___constant_scale_0_0_a(
2887
2887
; GCN-NEXT: v_accvgpr_write_b32 a14, v30
2888
2888
; GCN-NEXT: s_waitcnt vmcnt(0)
2889
2889
; GCN-NEXT: s_nop 0
2890
- ; GCN-NEXT: v_mfma_scale_f32_32x32x64_f8f6f4 a[0:15], v[0:7], v[8:15], a[0:15], 0, 0 op_sel_hi:[0,0,0 ]
2890
+ ; GCN-NEXT: v_mfma_f32_32x32x64_f8f6f4 a[0:15], v[0:7], v[8:15], a[0:15]
2891
2891
; GCN-NEXT: s_nop 3
2892
2892
; GCN-NEXT: v_accvgpr_read_b32 v0, a0
2893
2893
; GCN-NEXT: v_accvgpr_read_b32 v1, a1
@@ -2935,7 +2935,7 @@ define <16 x float> @test_mfma_scale_f32_32x32x64_f8f6f4___constant_scale_0_0_b(
2935
2935
; GCN-NEXT: v_accvgpr_write_b32 a14, v30
2936
2936
; GCN-NEXT: s_waitcnt vmcnt(0)
2937
2937
; GCN-NEXT: s_nop 0
2938
- ; GCN-NEXT: v_mfma_scale_f32_32x32x64_f8f6f4 a[0:15], v[0:7], v[8:15], a[0:15], 0, 0 op_sel_hi:[0,0,0 ]
2938
+ ; GCN-NEXT: v_mfma_f32_32x32x64_f8f6f4 a[0:15], v[0:7], v[8:15], a[0:15]
2939
2939
; GCN-NEXT: s_nop 3
2940
2940
; GCN-NEXT: v_accvgpr_read_b32 v0, a0
2941
2941
; GCN-NEXT: v_accvgpr_read_b32 v1, a1
0 commit comments