@@ -54,7 +54,7 @@ define amdgpu_ps void @raw_buffer_atomic_add_rtn_f64(<4 x i32> inreg %rsrc, doub
54
54
; GFX942: ; %bb.0: ; %main_body
55
55
; GFX942-NEXT: buffer_atomic_add_f64 v[0:1], v2, s[0:3], 0 offen sc0
56
56
; GFX942-NEXT: s_waitcnt vmcnt(0)
57
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
57
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
58
58
; GFX942-NEXT: s_endpgm
59
59
main_body:
60
60
%ret = call double @llvm.amdgcn.raw.buffer.atomic.fadd.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 0 , i32 0 )
@@ -90,7 +90,7 @@ define amdgpu_kernel void @raw_buffer_atomic_add_rtn_f64_off4_slc(<4 x i32> %rsr
90
90
; GFX942-NEXT: buffer_atomic_add_f64 v[0:1], v2, s[0:3], 4 offen sc0 nt
91
91
; GFX942-NEXT: v_mov_b32_e32 v2, 0
92
92
; GFX942-NEXT: s_waitcnt vmcnt(0)
93
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
93
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
94
94
; GFX942-NEXT: s_endpgm
95
95
main_body:
96
96
%ret = call double @llvm.amdgcn.raw.buffer.atomic.fadd.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 4 , i32 2 )
@@ -137,7 +137,7 @@ define amdgpu_ps void @raw_ptr_buffer_atomic_add_rtn_f64(ptr addrspace(8) inreg
137
137
; GFX942: ; %bb.0: ; %main_body
138
138
; GFX942-NEXT: buffer_atomic_add_f64 v[0:1], v2, s[0:3], 0 offen sc0
139
139
; GFX942-NEXT: s_waitcnt vmcnt(0)
140
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
140
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
141
141
; GFX942-NEXT: s_endpgm
142
142
main_body:
143
143
%ret = call double @llvm.amdgcn.raw.ptr.buffer.atomic.fadd.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 0 , i32 0 )
@@ -173,7 +173,7 @@ define amdgpu_kernel void @raw_ptr_buffer_atomic_add_rtn_f64_off4_slc(ptr addrsp
173
173
; GFX942-NEXT: buffer_atomic_add_f64 v[0:1], v2, s[0:3], 4 offen sc0 nt
174
174
; GFX942-NEXT: v_mov_b32_e32 v2, 0
175
175
; GFX942-NEXT: s_waitcnt vmcnt(0)
176
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
176
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
177
177
; GFX942-NEXT: s_endpgm
178
178
main_body:
179
179
%ret = call double @llvm.amdgcn.raw.ptr.buffer.atomic.fadd.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 4 , i32 2 )
@@ -220,7 +220,7 @@ define amdgpu_ps void @struct_buffer_atomic_add_rtn_f64(<4 x i32> inreg %rsrc, d
220
220
; GFX942: ; %bb.0: ; %main_body
221
221
; GFX942-NEXT: buffer_atomic_add_f64 v[0:1], v2, s[0:3], 0 idxen sc0
222
222
; GFX942-NEXT: s_waitcnt vmcnt(0)
223
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
223
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
224
224
; GFX942-NEXT: s_endpgm
225
225
main_body:
226
226
%ret = call double @llvm.amdgcn.struct.buffer.atomic.fadd.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 0 , i32 0 , i32 0 )
@@ -256,7 +256,7 @@ define amdgpu_kernel void @struct_buffer_atomic_add_rtn_f64_off4_slc(<4 x i32> %
256
256
; GFX942-NEXT: buffer_atomic_add_f64 v[0:1], v2, s[0:3], 0 idxen offset:4 sc0 nt
257
257
; GFX942-NEXT: v_mov_b32_e32 v2, 0
258
258
; GFX942-NEXT: s_waitcnt vmcnt(0)
259
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
259
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
260
260
; GFX942-NEXT: s_endpgm
261
261
main_body:
262
262
%ret = call double @llvm.amdgcn.struct.buffer.atomic.fadd.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 4 , i32 0 , i32 2 )
@@ -303,7 +303,7 @@ define amdgpu_ps void @struct_ptr_buffer_atomic_add_rtn_f64(ptr addrspace(8) inr
303
303
; GFX942: ; %bb.0: ; %main_body
304
304
; GFX942-NEXT: buffer_atomic_add_f64 v[0:1], v2, s[0:3], 0 idxen sc0
305
305
; GFX942-NEXT: s_waitcnt vmcnt(0)
306
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
306
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
307
307
; GFX942-NEXT: s_endpgm
308
308
main_body:
309
309
%ret = call double @llvm.amdgcn.struct.ptr.buffer.atomic.fadd.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 0 , i32 0 , i32 0 )
@@ -339,7 +339,7 @@ define amdgpu_kernel void @struct_ptr_buffer_atomic_add_rtn_f64_off4_slc(ptr add
339
339
; GFX942-NEXT: buffer_atomic_add_f64 v[0:1], v2, s[0:3], 0 idxen offset:4 sc0 nt
340
340
; GFX942-NEXT: v_mov_b32_e32 v2, 0
341
341
; GFX942-NEXT: s_waitcnt vmcnt(0)
342
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
342
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
343
343
; GFX942-NEXT: s_endpgm
344
344
main_body:
345
345
%ret = call double @llvm.amdgcn.struct.ptr.buffer.atomic.fadd.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 4 , i32 0 , i32 2 )
@@ -386,7 +386,7 @@ define amdgpu_ps void @raw_buffer_atomic_min_rtn_f64(<4 x i32> inreg %rsrc, doub
386
386
; GFX942: ; %bb.0: ; %main_body
387
387
; GFX942-NEXT: buffer_atomic_min_f64 v[0:1], v2, s[0:3], 0 offen sc0
388
388
; GFX942-NEXT: s_waitcnt vmcnt(0)
389
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
389
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
390
390
; GFX942-NEXT: s_endpgm
391
391
main_body:
392
392
%ret = call double @llvm.amdgcn.raw.buffer.atomic.fmin.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 0 , i32 0 )
@@ -422,7 +422,7 @@ define amdgpu_kernel void @raw_buffer_atomic_min_rtn_f64_off4_slc(<4 x i32> %rsr
422
422
; GFX942-NEXT: buffer_atomic_min_f64 v[0:1], v2, s[0:3], 4 offen sc0 nt
423
423
; GFX942-NEXT: v_mov_b32_e32 v2, 0
424
424
; GFX942-NEXT: s_waitcnt vmcnt(0)
425
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
425
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
426
426
; GFX942-NEXT: s_endpgm
427
427
main_body:
428
428
%ret = call double @llvm.amdgcn.raw.buffer.atomic.fmin.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 4 , i32 2 )
@@ -469,7 +469,7 @@ define amdgpu_ps void @raw_ptr_buffer_atomic_min_rtn_f64(ptr addrspace(8) inreg
469
469
; GFX942: ; %bb.0: ; %main_body
470
470
; GFX942-NEXT: buffer_atomic_min_f64 v[0:1], v2, s[0:3], 0 offen sc0
471
471
; GFX942-NEXT: s_waitcnt vmcnt(0)
472
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
472
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
473
473
; GFX942-NEXT: s_endpgm
474
474
main_body:
475
475
%ret = call double @llvm.amdgcn.raw.ptr.buffer.atomic.fmin.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 0 , i32 0 )
@@ -505,7 +505,7 @@ define amdgpu_kernel void @raw_ptr_buffer_atomic_min_rtn_f64_off4_slc(ptr addrsp
505
505
; GFX942-NEXT: buffer_atomic_min_f64 v[0:1], v2, s[0:3], 4 offen sc0 nt
506
506
; GFX942-NEXT: v_mov_b32_e32 v2, 0
507
507
; GFX942-NEXT: s_waitcnt vmcnt(0)
508
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
508
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
509
509
; GFX942-NEXT: s_endpgm
510
510
main_body:
511
511
%ret = call double @llvm.amdgcn.raw.ptr.buffer.atomic.fmin.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 4 , i32 2 )
@@ -552,7 +552,7 @@ define amdgpu_ps void @struct_buffer_atomic_min_rtn_f64(<4 x i32> inreg %rsrc, d
552
552
; GFX942: ; %bb.0: ; %main_body
553
553
; GFX942-NEXT: buffer_atomic_min_f64 v[0:1], v2, s[0:3], 0 idxen sc0
554
554
; GFX942-NEXT: s_waitcnt vmcnt(0)
555
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
555
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
556
556
; GFX942-NEXT: s_endpgm
557
557
main_body:
558
558
%ret = call double @llvm.amdgcn.struct.buffer.atomic.fmin.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 0 , i32 0 , i32 0 )
@@ -588,7 +588,7 @@ define amdgpu_kernel void @struct_buffer_atomic_min_rtn_f64_off4_slc(<4 x i32> %
588
588
; GFX942-NEXT: buffer_atomic_min_f64 v[0:1], v2, s[0:3], 0 idxen offset:4 sc0 nt
589
589
; GFX942-NEXT: v_mov_b32_e32 v2, 0
590
590
; GFX942-NEXT: s_waitcnt vmcnt(0)
591
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
591
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
592
592
; GFX942-NEXT: s_endpgm
593
593
main_body:
594
594
%ret = call double @llvm.amdgcn.struct.buffer.atomic.fmin.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 4 , i32 0 , i32 2 )
@@ -635,7 +635,7 @@ define amdgpu_ps void @struct_ptr_buffer_atomic_min_rtn_f64(ptr addrspace(8) inr
635
635
; GFX942: ; %bb.0: ; %main_body
636
636
; GFX942-NEXT: buffer_atomic_min_f64 v[0:1], v2, s[0:3], 0 idxen sc0
637
637
; GFX942-NEXT: s_waitcnt vmcnt(0)
638
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
638
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
639
639
; GFX942-NEXT: s_endpgm
640
640
main_body:
641
641
%ret = call double @llvm.amdgcn.struct.ptr.buffer.atomic.fmin.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 0 , i32 0 , i32 0 )
@@ -671,7 +671,7 @@ define amdgpu_kernel void @struct_ptr_buffer_atomic_min_rtn_f64_off4_slc(ptr add
671
671
; GFX942-NEXT: buffer_atomic_min_f64 v[0:1], v2, s[0:3], 0 idxen offset:4 sc0 nt
672
672
; GFX942-NEXT: v_mov_b32_e32 v2, 0
673
673
; GFX942-NEXT: s_waitcnt vmcnt(0)
674
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
674
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
675
675
; GFX942-NEXT: s_endpgm
676
676
main_body:
677
677
%ret = call double @llvm.amdgcn.struct.ptr.buffer.atomic.fmin.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 4 , i32 0 , i32 2 )
@@ -718,7 +718,7 @@ define amdgpu_ps void @raw_buffer_atomic_max_rtn_f64(<4 x i32> inreg %rsrc, doub
718
718
; GFX942: ; %bb.0: ; %main_body
719
719
; GFX942-NEXT: buffer_atomic_max_f64 v[0:1], v2, s[0:3], 0 offen sc0
720
720
; GFX942-NEXT: s_waitcnt vmcnt(0)
721
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
721
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
722
722
; GFX942-NEXT: s_endpgm
723
723
main_body:
724
724
%ret = call double @llvm.amdgcn.raw.buffer.atomic.fmax.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 0 , i32 0 )
@@ -754,7 +754,7 @@ define amdgpu_kernel void @raw_buffer_atomic_max_rtn_f64_off4_slc(<4 x i32> %rsr
754
754
; GFX942-NEXT: buffer_atomic_max_f64 v[0:1], v2, s[0:3], 4 offen sc0 nt
755
755
; GFX942-NEXT: v_mov_b32_e32 v2, 0
756
756
; GFX942-NEXT: s_waitcnt vmcnt(0)
757
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
757
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
758
758
; GFX942-NEXT: s_endpgm
759
759
main_body:
760
760
%ret = call double @llvm.amdgcn.raw.buffer.atomic.fmax.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 4 , i32 2 )
@@ -801,7 +801,7 @@ define amdgpu_ps void @raw_ptr_buffer_atomic_max_rtn_f64(ptr addrspace(8) inreg
801
801
; GFX942: ; %bb.0: ; %main_body
802
802
; GFX942-NEXT: buffer_atomic_max_f64 v[0:1], v2, s[0:3], 0 offen sc0
803
803
; GFX942-NEXT: s_waitcnt vmcnt(0)
804
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
804
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
805
805
; GFX942-NEXT: s_endpgm
806
806
main_body:
807
807
%ret = call double @llvm.amdgcn.raw.ptr.buffer.atomic.fmax.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 0 , i32 0 )
@@ -837,7 +837,7 @@ define amdgpu_kernel void @raw_ptr_buffer_atomic_max_rtn_f64_off4_slc(ptr addrsp
837
837
; GFX942-NEXT: buffer_atomic_max_f64 v[0:1], v2, s[0:3], 4 offen sc0 nt
838
838
; GFX942-NEXT: v_mov_b32_e32 v2, 0
839
839
; GFX942-NEXT: s_waitcnt vmcnt(0)
840
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
840
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
841
841
; GFX942-NEXT: s_endpgm
842
842
main_body:
843
843
%ret = call double @llvm.amdgcn.raw.ptr.buffer.atomic.fmax.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 4 , i32 2 )
@@ -884,7 +884,7 @@ define amdgpu_ps void @struct_buffer_atomic_max_rtn_f64(<4 x i32> inreg %rsrc, d
884
884
; GFX942: ; %bb.0: ; %main_body
885
885
; GFX942-NEXT: buffer_atomic_max_f64 v[0:1], v2, s[0:3], 0 idxen sc0
886
886
; GFX942-NEXT: s_waitcnt vmcnt(0)
887
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
887
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
888
888
; GFX942-NEXT: s_endpgm
889
889
main_body:
890
890
%ret = call double @llvm.amdgcn.struct.buffer.atomic.fmax.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 0 , i32 0 , i32 0 )
@@ -920,7 +920,7 @@ define amdgpu_kernel void @struct_buffer_atomic_max_rtn_f64_off4_slc(<4 x i32> %
920
920
; GFX942-NEXT: buffer_atomic_max_f64 v[0:1], v2, s[0:3], 0 idxen offset:4 sc0 nt
921
921
; GFX942-NEXT: v_mov_b32_e32 v2, 0
922
922
; GFX942-NEXT: s_waitcnt vmcnt(0)
923
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
923
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
924
924
; GFX942-NEXT: s_endpgm
925
925
main_body:
926
926
%ret = call double @llvm.amdgcn.struct.buffer.atomic.fmax.f64 (double %data , <4 x i32 > %rsrc , i32 %vindex , i32 4 , i32 0 , i32 2 )
@@ -967,7 +967,7 @@ define amdgpu_ps void @struct_ptr_buffer_atomic_max_rtn_f64(ptr addrspace(8) inr
967
967
; GFX942: ; %bb.0: ; %main_body
968
968
; GFX942-NEXT: buffer_atomic_max_f64 v[0:1], v2, s[0:3], 0 idxen sc0
969
969
; GFX942-NEXT: s_waitcnt vmcnt(0)
970
- ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1] sc0 sc1
970
+ ; GFX942-NEXT: flat_store_dwordx2 v[0:1], v[0:1]
971
971
; GFX942-NEXT: s_endpgm
972
972
main_body:
973
973
%ret = call double @llvm.amdgcn.struct.ptr.buffer.atomic.fmax.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 0 , i32 0 , i32 0 )
@@ -1003,7 +1003,7 @@ define amdgpu_kernel void @struct_ptr_buffer_atomic_max_rtn_f64_off4_slc(ptr add
1003
1003
; GFX942-NEXT: buffer_atomic_max_f64 v[0:1], v2, s[0:3], 0 idxen offset:4 sc0 nt
1004
1004
; GFX942-NEXT: v_mov_b32_e32 v2, 0
1005
1005
; GFX942-NEXT: s_waitcnt vmcnt(0)
1006
- ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9] sc0 sc1
1006
+ ; GFX942-NEXT: global_store_dwordx2 v2, v[0:1], s[8:9]
1007
1007
; GFX942-NEXT: s_endpgm
1008
1008
main_body:
1009
1009
%ret = call double @llvm.amdgcn.struct.ptr.buffer.atomic.fmax.f64 (double %data , ptr addrspace (8 ) %rsrc , i32 %vindex , i32 4 , i32 0 , i32 2 )
0 commit comments