@@ -45,7 +45,7 @@ define float @test_cvt_f32_bf8_byte1(i32 %a) {
45
45
; GFX12-NEXT: s_wait_samplecnt 0x0
46
46
; GFX12-NEXT: s_wait_bvhcnt 0x0
47
47
; GFX12-NEXT: s_wait_kmcnt 0x0
48
- ; GFX12-NEXT: v_cvt_f32_bf8_e64 v0, v0 op_sel:[1,0 ]
48
+ ; GFX12-NEXT: v_cvt_f32_bf8_e64 v0, v0 op_sel:[0,1 ]
49
49
; GFX12-NEXT: s_setpc_b64 s[30:31]
50
50
%ret = tail call float @llvm.amdgcn.cvt.f32.bf8 (i32 %a , i32 1 )
51
51
ret float %ret
@@ -65,7 +65,7 @@ define float @test_cvt_f32_bf8_byte2(i32 %a) {
65
65
; GFX12-NEXT: s_wait_samplecnt 0x0
66
66
; GFX12-NEXT: s_wait_bvhcnt 0x0
67
67
; GFX12-NEXT: s_wait_kmcnt 0x0
68
- ; GFX12-NEXT: v_cvt_f32_bf8_e64 v0, v0 op_sel:[0,1 ]
68
+ ; GFX12-NEXT: v_cvt_f32_bf8_e64 v0, v0 op_sel:[1,0 ]
69
69
; GFX12-NEXT: s_setpc_b64 s[30:31]
70
70
%ret = tail call float @llvm.amdgcn.cvt.f32.bf8 (i32 %a , i32 2 )
71
71
ret float %ret
@@ -125,7 +125,7 @@ define float @test_cvt_f32_fp8_byte1(i32 %a) {
125
125
; GFX12-NEXT: s_wait_samplecnt 0x0
126
126
; GFX12-NEXT: s_wait_bvhcnt 0x0
127
127
; GFX12-NEXT: s_wait_kmcnt 0x0
128
- ; GFX12-NEXT: v_cvt_f32_fp8_e64 v0, v0 op_sel:[1,0 ]
128
+ ; GFX12-NEXT: v_cvt_f32_fp8_e64 v0, v0 op_sel:[0,1 ]
129
129
; GFX12-NEXT: s_setpc_b64 s[30:31]
130
130
%ret = tail call float @llvm.amdgcn.cvt.f32.fp8 (i32 %a , i32 1 )
131
131
ret float %ret
@@ -145,7 +145,7 @@ define float @test_cvt_f32_fp8_byte2(i32 %a) {
145
145
; GFX12-NEXT: s_wait_samplecnt 0x0
146
146
; GFX12-NEXT: s_wait_bvhcnt 0x0
147
147
; GFX12-NEXT: s_wait_kmcnt 0x0
148
- ; GFX12-NEXT: v_cvt_f32_fp8_e64 v0, v0 op_sel:[0,1 ]
148
+ ; GFX12-NEXT: v_cvt_f32_fp8_e64 v0, v0 op_sel:[1,0 ]
149
149
; GFX12-NEXT: s_setpc_b64 s[30:31]
150
150
%ret = tail call float @llvm.amdgcn.cvt.f32.fp8 (i32 %a , i32 2 )
151
151
ret float %ret
0 commit comments