@@ -117,7 +117,7 @@ define i32 @atomic_load_flat_monotonic_i16_zext_to_i32(ptr %ptr) {
117
117
; GCN-LABEL: atomic_load_flat_monotonic_i16_zext_to_i32:
118
118
; GCN: ; %bb.0:
119
119
; GCN-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
120
- ; GCN-NEXT: flat_load_ubyte v0, v[0:1] glc
120
+ ; GCN-NEXT: flat_load_ushort v0, v[0:1] glc
121
121
; GCN-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
122
122
; GCN-NEXT: s_setpc_b64 s[30:31]
123
123
%load = load atomic i16 , ptr %ptr monotonic , align 2
@@ -129,7 +129,7 @@ define i32 @atomic_load_flat_monotonic_i16_sext_to_i32(ptr %ptr) {
129
129
; GFX7-LABEL: atomic_load_flat_monotonic_i16_sext_to_i32:
130
130
; GFX7: ; %bb.0:
131
131
; GFX7-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
132
- ; GFX7-NEXT: flat_load_sbyte v2, v[0:1] glc
132
+ ; GFX7-NEXT: flat_load_sshort v2, v[0:1] glc
133
133
; GFX7-NEXT: flat_load_ushort v0, v[0:1] glc
134
134
; GFX7-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
135
135
; GFX7-NEXT: v_mov_b32_e32 v0, v2
@@ -138,7 +138,7 @@ define i32 @atomic_load_flat_monotonic_i16_sext_to_i32(ptr %ptr) {
138
138
; GFX8-LABEL: atomic_load_flat_monotonic_i16_sext_to_i32:
139
139
; GFX8: ; %bb.0:
140
140
; GFX8-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
141
- ; GFX8-NEXT: flat_load_sbyte v2, v[0:1] glc
141
+ ; GFX8-NEXT: flat_load_sshort v2, v[0:1] glc
142
142
; GFX8-NEXT: flat_load_ushort v0, v[0:1] glc
143
143
; GFX8-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
144
144
; GFX8-NEXT: v_mov_b32_e32 v0, v2
@@ -147,7 +147,7 @@ define i32 @atomic_load_flat_monotonic_i16_sext_to_i32(ptr %ptr) {
147
147
; GFX9-LABEL: atomic_load_flat_monotonic_i16_sext_to_i32:
148
148
; GFX9: ; %bb.0:
149
149
; GFX9-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
150
- ; GFX9-NEXT: flat_load_sbyte v2, v[0:1] glc
150
+ ; GFX9-NEXT: flat_load_sshort v2, v[0:1] glc
151
151
; GFX9-NEXT: flat_load_ushort v3, v[0:1] glc
152
152
; GFX9-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
153
153
; GFX9-NEXT: v_mov_b32_e32 v0, v2
@@ -183,7 +183,7 @@ define i32 @atomic_load_flat_monotonic_f16_zext_to_i32(ptr %ptr) {
183
183
; GCN-LABEL: atomic_load_flat_monotonic_f16_zext_to_i32:
184
184
; GCN: ; %bb.0:
185
185
; GCN-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
186
- ; GCN-NEXT: flat_load_ubyte v0, v[0:1] glc
186
+ ; GCN-NEXT: flat_load_ushort v0, v[0:1] glc
187
187
; GCN-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
188
188
; GCN-NEXT: s_setpc_b64 s[30:31]
189
189
%load = load atomic half , ptr %ptr monotonic , align 2
@@ -196,7 +196,7 @@ define i32 @atomic_load_flat_monotonic_bf16_zext_to_i32(ptr %ptr) {
196
196
; GCN-LABEL: atomic_load_flat_monotonic_bf16_zext_to_i32:
197
197
; GCN: ; %bb.0:
198
198
; GCN-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
199
- ; GCN-NEXT: flat_load_ubyte v0, v[0:1] glc
199
+ ; GCN-NEXT: flat_load_ushort v0, v[0:1] glc
200
200
; GCN-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
201
201
; GCN-NEXT: s_setpc_b64 s[30:31]
202
202
%load = load atomic bfloat, ptr %ptr monotonic , align 2
@@ -209,7 +209,7 @@ define i32 @atomic_load_flat_monotonic_i16_d16_hi_shift(ptr %ptr) {
209
209
; GCN-LABEL: atomic_load_flat_monotonic_i16_d16_hi_shift:
210
210
; GCN: ; %bb.0:
211
211
; GCN-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
212
- ; GCN-NEXT: flat_load_ubyte v0, v[0:1] glc
212
+ ; GCN-NEXT: flat_load_ushort v0, v[0:1] glc
213
213
; GCN-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
214
214
; GCN-NEXT: v_lshlrev_b32_e32 v0, 16, v0
215
215
; GCN-NEXT: s_setpc_b64 s[30:31]
@@ -223,7 +223,7 @@ define <2 x i16> @atomic_load_flat_monotonic_i16_d16_hi_vector_insert(ptr %ptr,
223
223
; GFX7-LABEL: atomic_load_flat_monotonic_i16_d16_hi_vector_insert:
224
224
; GFX7: ; %bb.0:
225
225
; GFX7-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
226
- ; GFX7-NEXT: flat_load_ubyte v0, v[0:1] glc
226
+ ; GFX7-NEXT: flat_load_ushort v0, v[0:1] glc
227
227
; GFX7-NEXT: v_lshlrev_b32_e32 v1, 16, v3
228
228
; GFX7-NEXT: v_and_b32_e32 v2, 0xffff, v2
229
229
; GFX7-NEXT: v_or_b32_e32 v1, v1, v2
@@ -237,7 +237,7 @@ define <2 x i16> @atomic_load_flat_monotonic_i16_d16_hi_vector_insert(ptr %ptr,
237
237
; GFX8-LABEL: atomic_load_flat_monotonic_i16_d16_hi_vector_insert:
238
238
; GFX8: ; %bb.0:
239
239
; GFX8-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
240
- ; GFX8-NEXT: flat_load_ubyte v0, v[0:1] glc
240
+ ; GFX8-NEXT: flat_load_ushort v0, v[0:1] glc
241
241
; GFX8-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
242
242
; GFX8-NEXT: v_lshlrev_b32_e32 v0, 16, v0
243
243
; GFX8-NEXT: v_or_b32_sdwa v0, v2, v0 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_0 src1_sel:DWORD
@@ -246,7 +246,7 @@ define <2 x i16> @atomic_load_flat_monotonic_i16_d16_hi_vector_insert(ptr %ptr,
246
246
; GFX9-LABEL: atomic_load_flat_monotonic_i16_d16_hi_vector_insert:
247
247
; GFX9: ; %bb.0:
248
248
; GFX9-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
249
- ; GFX9-NEXT: flat_load_ubyte v0, v[0:1] glc
249
+ ; GFX9-NEXT: flat_load_ushort v0, v[0:1] glc
250
250
; GFX9-NEXT: v_mov_b32_e32 v1, 0xffff
251
251
; GFX9-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
252
252
; GFX9-NEXT: v_lshlrev_b32_e32 v0, 16, v0
@@ -261,7 +261,7 @@ define i32 @atomic_load_flat_monotonic_i16_d16_lo_or(ptr %ptr, i16 %high) {
261
261
; GFX7-LABEL: atomic_load_flat_monotonic_i16_d16_lo_or:
262
262
; GFX7: ; %bb.0:
263
263
; GFX7-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
264
- ; GFX7-NEXT: flat_load_ubyte v0, v[0:1] glc
264
+ ; GFX7-NEXT: flat_load_ushort v0, v[0:1] glc
265
265
; GFX7-NEXT: v_and_b32_e32 v1, 0xffff, v2
266
266
; GFX7-NEXT: v_lshlrev_b32_e32 v1, 16, v1
267
267
; GFX7-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
@@ -271,7 +271,7 @@ define i32 @atomic_load_flat_monotonic_i16_d16_lo_or(ptr %ptr, i16 %high) {
271
271
; GFX8-LABEL: atomic_load_flat_monotonic_i16_d16_lo_or:
272
272
; GFX8: ; %bb.0:
273
273
; GFX8-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
274
- ; GFX8-NEXT: flat_load_ubyte v0, v[0:1] glc
274
+ ; GFX8-NEXT: flat_load_ushort v0, v[0:1] glc
275
275
; GFX8-NEXT: v_and_b32_e32 v1, 0xffff, v2
276
276
; GFX8-NEXT: v_lshlrev_b32_e32 v1, 16, v1
277
277
; GFX8-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
@@ -281,7 +281,7 @@ define i32 @atomic_load_flat_monotonic_i16_d16_lo_or(ptr %ptr, i16 %high) {
281
281
; GFX9-LABEL: atomic_load_flat_monotonic_i16_d16_lo_or:
282
282
; GFX9: ; %bb.0:
283
283
; GFX9-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
284
- ; GFX9-NEXT: flat_load_ubyte v0, v[0:1] glc
284
+ ; GFX9-NEXT: flat_load_ushort v0, v[0:1] glc
285
285
; GFX9-NEXT: v_and_b32_e32 v1, 0xffff, v2
286
286
; GFX9-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
287
287
; GFX9-NEXT: v_lshl_or_b32 v0, v1, 16, v0
@@ -298,7 +298,7 @@ define <2 x i16> @atomic_load_flat_monotonic_i16_d16_lo_vector_insert(ptr %ptr,
298
298
; GFX7-LABEL: atomic_load_flat_monotonic_i16_d16_lo_vector_insert:
299
299
; GFX7: ; %bb.0:
300
300
; GFX7-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
301
- ; GFX7-NEXT: flat_load_ubyte v0, v[0:1] glc
301
+ ; GFX7-NEXT: flat_load_ushort v0, v[0:1] glc
302
302
; GFX7-NEXT: v_lshlrev_b32_e32 v1, 16, v3
303
303
; GFX7-NEXT: v_and_b32_e32 v2, 0xffff, v2
304
304
; GFX7-NEXT: v_or_b32_e32 v1, v1, v2
@@ -311,7 +311,7 @@ define <2 x i16> @atomic_load_flat_monotonic_i16_d16_lo_vector_insert(ptr %ptr,
311
311
; GFX8-LABEL: atomic_load_flat_monotonic_i16_d16_lo_vector_insert:
312
312
; GFX8: ; %bb.0:
313
313
; GFX8-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
314
- ; GFX8-NEXT: flat_load_ubyte v0, v[0:1] glc
314
+ ; GFX8-NEXT: flat_load_ushort v0, v[0:1] glc
315
315
; GFX8-NEXT: v_and_b32_e32 v1, 0xffff0000, v2
316
316
; GFX8-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
317
317
; GFX8-NEXT: v_or_b32_e32 v0, v1, v0
@@ -320,7 +320,7 @@ define <2 x i16> @atomic_load_flat_monotonic_i16_d16_lo_vector_insert(ptr %ptr,
320
320
; GFX9-LABEL: atomic_load_flat_monotonic_i16_d16_lo_vector_insert:
321
321
; GFX9: ; %bb.0:
322
322
; GFX9-NEXT: s_waitcnt vmcnt(0) expcnt(0) lgkmcnt(0)
323
- ; GFX9-NEXT: flat_load_ubyte v0, v[0:1] glc
323
+ ; GFX9-NEXT: flat_load_ushort v0, v[0:1] glc
324
324
; GFX9-NEXT: v_mov_b32_e32 v1, 0xffff0000
325
325
; GFX9-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
326
326
; GFX9-NEXT: v_and_or_b32 v0, v2, v1, v0
0 commit comments