@@ -12,7 +12,7 @@ define amdgpu_ps <4 x float> @load_2dmsaa(<8 x i32> inreg %rsrc, i32 %s, i32 %t,
12
12
; GFX12-LABEL: load_2dmsaa:
13
13
; GFX12: ; %bb.0: ; %main_body
14
14
; GFX12-NEXT: image_msaa_load v[0:3], [v0, v1, v2], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_MSAA unorm ; encoding: [0x06,0x20,0x46,0xe4,0x00,0x00,0x00,0x00,0x00,0x01,0x02,0x00]
15
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
15
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
16
16
; GFX12-NEXT: ; return to shader part epilog
17
17
main_body:
18
18
%v = call <4 x float > @llvm.amdgcn.image.msaa.load.2dmsaa.v4f32.i32 (i32 1 , i32 %s , i32 %t , i32 %fragid , <8 x i32 > %rsrc , i32 0 , i32 0 )
@@ -32,7 +32,7 @@ define amdgpu_ps <4 x float> @load_2dmsaa_both(<8 x i32> inreg %rsrc, ptr addrsp
32
32
; GFX12: ; %bb.0: ; %main_body
33
33
; GFX12-NEXT: image_msaa_load v[0:4], [v0, v1, v2], s[0:7] dmask:0x2 dim:SQ_RSRC_IMG_2D_MSAA unorm tfe lwe ; encoding: [0x0e,0x20,0x86,0xe4,0x00,0x01,0x00,0x00,0x00,0x01,0x02,0x00]
34
34
; GFX12-NEXT: v_mov_b32_e32 v5, 0 ; encoding: [0x80,0x02,0x0a,0x7e]
35
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
35
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
36
36
; GFX12-NEXT: global_store_b32 v5, v4, s[8:9] ; encoding: [0x08,0x80,0x06,0xee,0x00,0x00,0x00,0x02,0x05,0x00,0x00,0x00]
37
37
; GFX12-NEXT: ; return to shader part epilog
38
38
main_body:
@@ -53,7 +53,7 @@ define amdgpu_ps <4 x float> @load_2darraymsaa(<8 x i32> inreg %rsrc, i32 %s, i3
53
53
; GFX12-LABEL: load_2darraymsaa:
54
54
; GFX12: ; %bb.0: ; %main_body
55
55
; GFX12-NEXT: image_msaa_load v[0:3], [v0, v1, v2, v3], s[0:7] dmask:0x4 dim:SQ_RSRC_IMG_2D_MSAA_ARRAY unorm ; encoding: [0x07,0x20,0x06,0xe5,0x00,0x00,0x00,0x00,0x00,0x01,0x02,0x03]
56
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
56
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
57
57
; GFX12-NEXT: ; return to shader part epilog
58
58
main_body:
59
59
%v = call <4 x float > @llvm.amdgcn.image.msaa.load.2darraymsaa.v4f32.i32 (i32 4 , i32 %s , i32 %t , i32 %slice , i32 %fragid , <8 x i32 > %rsrc , i32 0 , i32 0 )
@@ -73,7 +73,7 @@ define amdgpu_ps <4 x float> @load_2darraymsaa_tfe(<8 x i32> inreg %rsrc, ptr ad
73
73
; GFX12: ; %bb.0: ; %main_body
74
74
; GFX12-NEXT: image_msaa_load v[0:4], [v0, v1, v2, v3], s[0:7] dmask:0x8 dim:SQ_RSRC_IMG_2D_MSAA_ARRAY unorm tfe ; encoding: [0x0f,0x20,0x06,0xe6,0x00,0x00,0x00,0x00,0x00,0x01,0x02,0x03]
75
75
; GFX12-NEXT: v_mov_b32_e32 v5, 0 ; encoding: [0x80,0x02,0x0a,0x7e]
76
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
76
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
77
77
; GFX12-NEXT: global_store_b32 v5, v4, s[8:9] ; encoding: [0x08,0x80,0x06,0xee,0x00,0x00,0x00,0x02,0x05,0x00,0x00,0x00]
78
78
; GFX12-NEXT: ; return to shader part epilog
79
79
main_body:
@@ -94,7 +94,7 @@ define amdgpu_ps <4 x float> @load_2dmsaa_glc(<8 x i32> inreg %rsrc, i32 %s, i32
94
94
; GFX12-LABEL: load_2dmsaa_glc:
95
95
; GFX12: ; %bb.0: ; %main_body
96
96
; GFX12-NEXT: image_msaa_load v[0:3], [v0, v1, v2], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_MSAA unorm th:TH_LOAD_NT ; encoding: [0x06,0x20,0x46,0xe4,0x00,0x00,0x10,0x00,0x00,0x01,0x02,0x00]
97
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
97
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
98
98
; GFX12-NEXT: ; return to shader part epilog
99
99
main_body:
100
100
%v = call <4 x float > @llvm.amdgcn.image.msaa.load.2dmsaa.v4f32.i32 (i32 1 , i32 %s , i32 %t , i32 %fragid , <8 x i32 > %rsrc , i32 0 , i32 1 )
@@ -111,7 +111,7 @@ define amdgpu_ps <4 x float> @load_2dmsaa_slc(<8 x i32> inreg %rsrc, i32 %s, i32
111
111
; GFX12-LABEL: load_2dmsaa_slc:
112
112
; GFX12: ; %bb.0: ; %main_body
113
113
; GFX12-NEXT: image_msaa_load v[0:3], [v0, v1, v2], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_MSAA unorm th:TH_LOAD_HT ; encoding: [0x06,0x20,0x46,0xe4,0x00,0x00,0x20,0x00,0x00,0x01,0x02,0x00]
114
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
114
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
115
115
; GFX12-NEXT: ; return to shader part epilog
116
116
main_body:
117
117
%v = call <4 x float > @llvm.amdgcn.image.msaa.load.2dmsaa.v4f32.i32 (i32 1 , i32 %s , i32 %t , i32 %fragid , <8 x i32 > %rsrc , i32 0 , i32 2 )
@@ -128,7 +128,7 @@ define amdgpu_ps <4 x float> @load_2dmsaa_glc_slc(<8 x i32> inreg %rsrc, i32 %s,
128
128
; GFX12-LABEL: load_2dmsaa_glc_slc:
129
129
; GFX12: ; %bb.0: ; %main_body
130
130
; GFX12-NEXT: image_msaa_load v[0:3], [v0, v1, v2], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_MSAA unorm th:TH_LOAD_LU ; encoding: [0x06,0x20,0x46,0xe4,0x00,0x00,0x30,0x00,0x00,0x01,0x02,0x00]
131
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
131
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
132
132
; GFX12-NEXT: ; return to shader part epilog
133
133
main_body:
134
134
%v = call <4 x float > @llvm.amdgcn.image.msaa.load.2dmsaa.v4f32.i32 (i32 1 , i32 %s , i32 %t , i32 %fragid , <8 x i32 > %rsrc , i32 0 , i32 3 )
@@ -145,7 +145,7 @@ define amdgpu_ps <4 x half> @load_2dmsaa_d16(<8 x i32> inreg %rsrc, i32 %s, i32
145
145
; GFX12-LABEL: load_2dmsaa_d16:
146
146
; GFX12: ; %bb.0: ; %main_body
147
147
; GFX12-NEXT: image_msaa_load v[0:1], [v0, v1, v2], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_MSAA unorm d16 ; encoding: [0x26,0x20,0x46,0xe4,0x00,0x00,0x00,0x00,0x00,0x01,0x02,0x00]
148
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
148
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
149
149
; GFX12-NEXT: ; return to shader part epilog
150
150
main_body:
151
151
%v = call <4 x half > @llvm.amdgcn.image.msaa.load.2dmsaa.v4f16.i32 (i32 1 , i32 %s , i32 %t , i32 %fragid , <8 x i32 > %rsrc , i32 0 , i32 0 )
@@ -165,7 +165,7 @@ define amdgpu_ps <4 x half> @load_2dmsaa_tfe_d16(<8 x i32> inreg %rsrc, ptr addr
165
165
; GFX12: ; %bb.0: ; %main_body
166
166
; GFX12-NEXT: image_msaa_load v[0:2], [v0, v1, v2], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_MSAA unorm tfe d16 ; encoding: [0x2e,0x20,0x46,0xe4,0x00,0x00,0x00,0x00,0x00,0x01,0x02,0x00]
167
167
; GFX12-NEXT: v_mov_b32_e32 v3, 0 ; encoding: [0x80,0x02,0x06,0x7e]
168
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
168
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
169
169
; GFX12-NEXT: global_store_b32 v3, v2, s[8:9] ; encoding: [0x08,0x80,0x06,0xee,0x00,0x00,0x00,0x01,0x03,0x00,0x00,0x00]
170
170
; GFX12-NEXT: ; return to shader part epilog
171
171
main_body:
@@ -186,7 +186,7 @@ define amdgpu_ps <4 x half> @load_2darraymsaa_d16(<8 x i32> inreg %rsrc, i32 %s,
186
186
; GFX12-LABEL: load_2darraymsaa_d16:
187
187
; GFX12: ; %bb.0: ; %main_body
188
188
; GFX12-NEXT: image_msaa_load v[0:1], [v0, v1, v2, v3], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_MSAA_ARRAY unorm d16 ; encoding: [0x27,0x20,0x46,0xe4,0x00,0x00,0x00,0x00,0x00,0x01,0x02,0x03]
189
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
189
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
190
190
; GFX12-NEXT: ; return to shader part epilog
191
191
main_body:
192
192
%v = call <4 x half > @llvm.amdgcn.image.msaa.load.2darraymsaa.v4f16.i32 (i32 1 , i32 %s , i32 %t , i32 %slice , i32 %fragid , <8 x i32 > %rsrc , i32 0 , i32 0 )
@@ -206,7 +206,7 @@ define amdgpu_ps <4 x half> @load_2darraymsaa_tfe_d16(<8 x i32> inreg %rsrc, ptr
206
206
; GFX12: ; %bb.0: ; %main_body
207
207
; GFX12-NEXT: image_msaa_load v[0:2], [v0, v1, v2, v3], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_MSAA_ARRAY unorm tfe d16 ; encoding: [0x2f,0x20,0x46,0xe4,0x00,0x00,0x00,0x00,0x00,0x01,0x02,0x03]
208
208
; GFX12-NEXT: v_mov_b32_e32 v3, 0 ; encoding: [0x80,0x02,0x06,0x7e]
209
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
209
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
210
210
; GFX12-NEXT: global_store_b32 v3, v2, s[8:9] ; encoding: [0x08,0x80,0x06,0xee,0x00,0x00,0x00,0x01,0x03,0x00,0x00,0x00]
211
211
; GFX12-NEXT: ; return to shader part epilog
212
212
main_body:
@@ -229,7 +229,7 @@ define amdgpu_ps <4 x float> @load_2dmsaa_a16(<8 x i32> inreg %rsrc, i16 %s, i16
229
229
; GFX12: ; %bb.0: ; %main_body
230
230
; GFX12-NEXT: v_perm_b32 v0, v1, v0, 0x5040100 ; encoding: [0x00,0x00,0x44,0xd6,0x01,0x01,0xfe,0x03,0x00,0x01,0x04,0x05]
231
231
; GFX12-NEXT: image_msaa_load v[0:3], [v0, v2], s[0:7] dmask:0x1 dim:SQ_RSRC_IMG_2D_MSAA unorm a16 ; encoding: [0x46,0x20,0x46,0xe4,0x00,0x00,0x00,0x00,0x00,0x02,0x00,0x00]
232
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
232
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
233
233
; GFX12-NEXT: ; return to shader part epilog
234
234
main_body:
235
235
%v = call <4 x float > @llvm.amdgcn.image.msaa.load.2dmsaa.v4f32.i16 (i32 1 , i16 %s , i16 %t , i16 %fragid , <8 x i32 > %rsrc , i32 0 , i32 0 )
@@ -250,7 +250,7 @@ define amdgpu_ps <4 x float> @load_2darraymsaa_a16(<8 x i32> inreg %rsrc, i16 %s
250
250
; GFX12-NEXT: v_perm_b32 v2, v3, v2, 0x5040100 ; encoding: [0x02,0x00,0x44,0xd6,0x03,0x05,0xfe,0x03,0x00,0x01,0x04,0x05]
251
251
; GFX12-NEXT: v_perm_b32 v0, v1, v0, 0x5040100 ; encoding: [0x00,0x00,0x44,0xd6,0x01,0x01,0xfe,0x03,0x00,0x01,0x04,0x05]
252
252
; GFX12-NEXT: image_msaa_load v[0:3], [v0, v2], s[0:7] dmask:0x4 dim:SQ_RSRC_IMG_2D_MSAA_ARRAY unorm a16 ; encoding: [0x47,0x20,0x06,0xe5,0x00,0x00,0x00,0x00,0x00,0x02,0x00,0x00]
253
- ; GFX12-NEXT: s_wait_loadcnt 0x0 ; encoding: [0x00,0x00,0xc0 ,0xbf]
253
+ ; GFX12-NEXT: s_wait_samplecnt 0x0 ; encoding: [0x00,0x00,0xc2 ,0xbf]
254
254
; GFX12-NEXT: ; return to shader part epilog
255
255
main_body:
256
256
%v = call <4 x float > @llvm.amdgcn.image.msaa.load.2darraymsaa.v4f32.i16 (i32 4 , i16 %s , i16 %t , i16 %slice , i16 %fragid , <8 x i32 > %rsrc , i32 0 , i32 0 )
0 commit comments