@@ -238,8 +238,6 @@ define amdgpu_kernel void @add_i32_constant(ptr addrspace(1) %out, ptr addrspace
238
238
; GFX1264-NEXT: s_waitcnt lgkmcnt(0)
239
239
; GFX1264-NEXT: s_mov_b32 s8, s2
240
240
; GFX1264-NEXT: s_mov_b32 s9, s3
241
- ; GFX1264-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
242
- ; GFX1264-NEXT: s_waitcnt_vscnt null, 0x0
243
241
; GFX1264-NEXT: buffer_atomic_add_u32 v1, off, s[8:11], null th:TH_ATOMIC_RETURN
244
242
; GFX1264-NEXT: s_waitcnt vmcnt(0)
245
243
; GFX1264-NEXT: buffer_gl0_inv
@@ -276,8 +274,6 @@ define amdgpu_kernel void @add_i32_constant(ptr addrspace(1) %out, ptr addrspace
276
274
; GFX1232-NEXT: s_waitcnt lgkmcnt(0)
277
275
; GFX1232-NEXT: s_mov_b32 s8, s2
278
276
; GFX1232-NEXT: s_mov_b32 s9, s3
279
- ; GFX1232-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
280
- ; GFX1232-NEXT: s_waitcnt_vscnt null, 0x0
281
277
; GFX1232-NEXT: buffer_atomic_add_u32 v1, off, s[8:11], null th:TH_ATOMIC_RETURN
282
278
; GFX1232-NEXT: s_waitcnt vmcnt(0)
283
279
; GFX1232-NEXT: buffer_gl0_inv
@@ -573,8 +569,6 @@ define amdgpu_kernel void @add_i32_uniform(ptr addrspace(1) %out, ptr addrspace(
573
569
; GFX1264-NEXT: v_mov_b32_e32 v1, s2
574
570
; GFX1264-NEXT: s_mov_b32 s12, s6
575
571
; GFX1264-NEXT: s_mov_b32 s13, s7
576
- ; GFX1264-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
577
- ; GFX1264-NEXT: s_waitcnt_vscnt null, 0x0
578
572
; GFX1264-NEXT: buffer_atomic_add_u32 v1, off, s[12:15], null th:TH_ATOMIC_RETURN
579
573
; GFX1264-NEXT: s_waitcnt vmcnt(0)
580
574
; GFX1264-NEXT: buffer_gl0_inv
@@ -614,8 +608,6 @@ define amdgpu_kernel void @add_i32_uniform(ptr addrspace(1) %out, ptr addrspace(
614
608
; GFX1232-NEXT: v_mov_b32_e32 v1, s2
615
609
; GFX1232-NEXT: s_mov_b32 s8, s6
616
610
; GFX1232-NEXT: s_mov_b32 s9, s7
617
- ; GFX1232-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
618
- ; GFX1232-NEXT: s_waitcnt_vscnt null, 0x0
619
611
; GFX1232-NEXT: buffer_atomic_add_u32 v1, off, s[8:11], null th:TH_ATOMIC_RETURN
620
612
; GFX1232-NEXT: s_waitcnt vmcnt(0)
621
613
; GFX1232-NEXT: buffer_gl0_inv
@@ -990,8 +982,6 @@ define amdgpu_kernel void @add_i32_varying(ptr addrspace(1) %out, ptr addrspace(
990
982
; GFX1264-NEXT: s_waitcnt lgkmcnt(0)
991
983
; GFX1264-NEXT: s_mov_b32 s8, s2
992
984
; GFX1264-NEXT: s_mov_b32 s9, s3
993
- ; GFX1264-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
994
- ; GFX1264-NEXT: s_waitcnt_vscnt null, 0x0
995
985
; GFX1264-NEXT: buffer_atomic_add_u32 v0, off, s[8:11], null th:TH_ATOMIC_RETURN
996
986
; GFX1264-NEXT: s_waitcnt vmcnt(0)
997
987
; GFX1264-NEXT: buffer_gl0_inv
@@ -1041,8 +1031,6 @@ define amdgpu_kernel void @add_i32_varying(ptr addrspace(1) %out, ptr addrspace(
1041
1031
; GFX1232-NEXT: s_waitcnt lgkmcnt(0)
1042
1032
; GFX1232-NEXT: s_mov_b32 s8, s2
1043
1033
; GFX1232-NEXT: s_mov_b32 s9, s3
1044
- ; GFX1232-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
1045
- ; GFX1232-NEXT: s_waitcnt_vscnt null, 0x0
1046
1034
; GFX1232-NEXT: buffer_atomic_add_u32 v0, off, s[8:11], null th:TH_ATOMIC_RETURN
1047
1035
; GFX1232-NEXT: s_waitcnt vmcnt(0)
1048
1036
; GFX1232-NEXT: buffer_gl0_inv
@@ -1311,8 +1299,6 @@ define amdgpu_kernel void @add_i64_constant(ptr addrspace(1) %out, ptr addrspace
1311
1299
; GFX1264-NEXT: s_waitcnt lgkmcnt(0)
1312
1300
; GFX1264-NEXT: s_mov_b32 s8, s2
1313
1301
; GFX1264-NEXT: s_mov_b32 s9, s3
1314
- ; GFX1264-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
1315
- ; GFX1264-NEXT: s_waitcnt_vscnt null, 0x0
1316
1302
; GFX1264-NEXT: buffer_atomic_add_u64 v[0:1], off, s[8:11], null th:TH_ATOMIC_RETURN
1317
1303
; GFX1264-NEXT: s_waitcnt vmcnt(0)
1318
1304
; GFX1264-NEXT: buffer_gl0_inv
@@ -1350,8 +1336,6 @@ define amdgpu_kernel void @add_i64_constant(ptr addrspace(1) %out, ptr addrspace
1350
1336
; GFX1232-NEXT: s_waitcnt lgkmcnt(0)
1351
1337
; GFX1232-NEXT: s_mov_b32 s8, s2
1352
1338
; GFX1232-NEXT: s_mov_b32 s9, s3
1353
- ; GFX1232-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
1354
- ; GFX1232-NEXT: s_waitcnt_vscnt null, 0x0
1355
1339
; GFX1232-NEXT: buffer_atomic_add_u64 v[0:1], off, s[8:11], null th:TH_ATOMIC_RETURN
1356
1340
; GFX1232-NEXT: s_waitcnt vmcnt(0)
1357
1341
; GFX1232-NEXT: buffer_gl0_inv
@@ -1704,8 +1688,6 @@ define amdgpu_kernel void @add_i64_uniform(ptr addrspace(1) %out, ptr addrspace(
1704
1688
; GFX1264-NEXT: s_mov_b32 s10, -1
1705
1689
; GFX1264-NEXT: s_mov_b32 s8, s6
1706
1690
; GFX1264-NEXT: s_mov_b32 s9, s7
1707
- ; GFX1264-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
1708
- ; GFX1264-NEXT: s_waitcnt_vscnt null, 0x0
1709
1691
; GFX1264-NEXT: buffer_atomic_add_u64 v[0:1], off, s[8:11], null th:TH_ATOMIC_RETURN
1710
1692
; GFX1264-NEXT: s_waitcnt vmcnt(0)
1711
1693
; GFX1264-NEXT: buffer_gl0_inv
@@ -1751,8 +1733,6 @@ define amdgpu_kernel void @add_i64_uniform(ptr addrspace(1) %out, ptr addrspace(
1751
1733
; GFX1232-NEXT: s_mov_b32 s10, -1
1752
1734
; GFX1232-NEXT: s_mov_b32 s8, s6
1753
1735
; GFX1232-NEXT: s_mov_b32 s9, s7
1754
- ; GFX1232-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
1755
- ; GFX1232-NEXT: s_waitcnt_vscnt null, 0x0
1756
1736
; GFX1232-NEXT: buffer_atomic_add_u64 v[0:1], off, s[8:11], null th:TH_ATOMIC_RETURN
1757
1737
; GFX1232-NEXT: s_waitcnt vmcnt(0)
1758
1738
; GFX1232-NEXT: buffer_gl0_inv
@@ -1871,8 +1851,6 @@ define amdgpu_kernel void @add_i64_varying(ptr addrspace(1) %out, ptr addrspace(
1871
1851
; GFX12-NEXT: s_mov_b32 s8, s2
1872
1852
; GFX12-NEXT: s_mov_b32 s9, s3
1873
1853
; GFX12-NEXT: s_mov_b32 s4, s0
1874
- ; GFX12-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
1875
- ; GFX12-NEXT: s_waitcnt_vscnt null, 0x0
1876
1854
; GFX12-NEXT: buffer_atomic_add_u64 v[0:1], off, s[8:11], null th:TH_ATOMIC_RETURN
1877
1855
; GFX12-NEXT: s_waitcnt vmcnt(0)
1878
1856
; GFX12-NEXT: buffer_gl0_inv
@@ -2154,8 +2132,6 @@ define amdgpu_kernel void @sub_i32_constant(ptr addrspace(1) %out, ptr addrspace
2154
2132
; GFX1264-NEXT: s_waitcnt lgkmcnt(0)
2155
2133
; GFX1264-NEXT: s_mov_b32 s8, s2
2156
2134
; GFX1264-NEXT: s_mov_b32 s9, s3
2157
- ; GFX1264-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
2158
- ; GFX1264-NEXT: s_waitcnt_vscnt null, 0x0
2159
2135
; GFX1264-NEXT: buffer_atomic_sub_u32 v1, off, s[8:11], null th:TH_ATOMIC_RETURN
2160
2136
; GFX1264-NEXT: s_waitcnt vmcnt(0)
2161
2137
; GFX1264-NEXT: buffer_gl0_inv
@@ -2193,8 +2169,6 @@ define amdgpu_kernel void @sub_i32_constant(ptr addrspace(1) %out, ptr addrspace
2193
2169
; GFX1232-NEXT: s_waitcnt lgkmcnt(0)
2194
2170
; GFX1232-NEXT: s_mov_b32 s8, s2
2195
2171
; GFX1232-NEXT: s_mov_b32 s9, s3
2196
- ; GFX1232-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
2197
- ; GFX1232-NEXT: s_waitcnt_vscnt null, 0x0
2198
2172
; GFX1232-NEXT: buffer_atomic_sub_u32 v1, off, s[8:11], null th:TH_ATOMIC_RETURN
2199
2173
; GFX1232-NEXT: s_waitcnt vmcnt(0)
2200
2174
; GFX1232-NEXT: buffer_gl0_inv
@@ -2495,8 +2469,6 @@ define amdgpu_kernel void @sub_i32_uniform(ptr addrspace(1) %out, ptr addrspace(
2495
2469
; GFX1264-NEXT: v_mov_b32_e32 v1, s2
2496
2470
; GFX1264-NEXT: s_mov_b32 s12, s6
2497
2471
; GFX1264-NEXT: s_mov_b32 s13, s7
2498
- ; GFX1264-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
2499
- ; GFX1264-NEXT: s_waitcnt_vscnt null, 0x0
2500
2472
; GFX1264-NEXT: buffer_atomic_sub_u32 v1, off, s[12:15], null th:TH_ATOMIC_RETURN
2501
2473
; GFX1264-NEXT: s_waitcnt vmcnt(0)
2502
2474
; GFX1264-NEXT: buffer_gl0_inv
@@ -2536,8 +2508,6 @@ define amdgpu_kernel void @sub_i32_uniform(ptr addrspace(1) %out, ptr addrspace(
2536
2508
; GFX1232-NEXT: v_mov_b32_e32 v1, s2
2537
2509
; GFX1232-NEXT: s_mov_b32 s8, s6
2538
2510
; GFX1232-NEXT: s_mov_b32 s9, s7
2539
- ; GFX1232-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
2540
- ; GFX1232-NEXT: s_waitcnt_vscnt null, 0x0
2541
2511
; GFX1232-NEXT: buffer_atomic_sub_u32 v1, off, s[8:11], null th:TH_ATOMIC_RETURN
2542
2512
; GFX1232-NEXT: s_waitcnt vmcnt(0)
2543
2513
; GFX1232-NEXT: buffer_gl0_inv
@@ -2912,8 +2882,6 @@ define amdgpu_kernel void @sub_i32_varying(ptr addrspace(1) %out, ptr addrspace(
2912
2882
; GFX1264-NEXT: s_waitcnt lgkmcnt(0)
2913
2883
; GFX1264-NEXT: s_mov_b32 s8, s2
2914
2884
; GFX1264-NEXT: s_mov_b32 s9, s3
2915
- ; GFX1264-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
2916
- ; GFX1264-NEXT: s_waitcnt_vscnt null, 0x0
2917
2885
; GFX1264-NEXT: buffer_atomic_sub_u32 v0, off, s[8:11], null th:TH_ATOMIC_RETURN
2918
2886
; GFX1264-NEXT: s_waitcnt vmcnt(0)
2919
2887
; GFX1264-NEXT: buffer_gl0_inv
@@ -2963,8 +2931,6 @@ define amdgpu_kernel void @sub_i32_varying(ptr addrspace(1) %out, ptr addrspace(
2963
2931
; GFX1232-NEXT: s_waitcnt lgkmcnt(0)
2964
2932
; GFX1232-NEXT: s_mov_b32 s8, s2
2965
2933
; GFX1232-NEXT: s_mov_b32 s9, s3
2966
- ; GFX1232-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
2967
- ; GFX1232-NEXT: s_waitcnt_vscnt null, 0x0
2968
2934
; GFX1232-NEXT: buffer_atomic_sub_u32 v0, off, s[8:11], null th:TH_ATOMIC_RETURN
2969
2935
; GFX1232-NEXT: s_waitcnt vmcnt(0)
2970
2936
; GFX1232-NEXT: buffer_gl0_inv
@@ -3284,8 +3250,6 @@ define amdgpu_kernel void @sub_i64_constant(ptr addrspace(1) %out, ptr addrspace
3284
3250
; GFX1264-NEXT: s_waitcnt lgkmcnt(0)
3285
3251
; GFX1264-NEXT: s_mov_b32 s8, s2
3286
3252
; GFX1264-NEXT: s_mov_b32 s9, s3
3287
- ; GFX1264-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
3288
- ; GFX1264-NEXT: s_waitcnt_vscnt null, 0x0
3289
3253
; GFX1264-NEXT: buffer_atomic_sub_u64 v[0:1], off, s[8:11], null th:TH_ATOMIC_RETURN
3290
3254
; GFX1264-NEXT: s_waitcnt vmcnt(0)
3291
3255
; GFX1264-NEXT: buffer_gl0_inv
@@ -3326,8 +3290,6 @@ define amdgpu_kernel void @sub_i64_constant(ptr addrspace(1) %out, ptr addrspace
3326
3290
; GFX1232-NEXT: s_waitcnt lgkmcnt(0)
3327
3291
; GFX1232-NEXT: s_mov_b32 s8, s2
3328
3292
; GFX1232-NEXT: s_mov_b32 s9, s3
3329
- ; GFX1232-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
3330
- ; GFX1232-NEXT: s_waitcnt_vscnt null, 0x0
3331
3293
; GFX1232-NEXT: buffer_atomic_sub_u64 v[0:1], off, s[8:11], null th:TH_ATOMIC_RETURN
3332
3294
; GFX1232-NEXT: s_waitcnt vmcnt(0)
3333
3295
; GFX1232-NEXT: buffer_gl0_inv
@@ -3696,8 +3658,6 @@ define amdgpu_kernel void @sub_i64_uniform(ptr addrspace(1) %out, ptr addrspace(
3696
3658
; GFX1264-NEXT: s_mov_b32 s10, -1
3697
3659
; GFX1264-NEXT: s_mov_b32 s8, s6
3698
3660
; GFX1264-NEXT: s_mov_b32 s9, s7
3699
- ; GFX1264-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
3700
- ; GFX1264-NEXT: s_waitcnt_vscnt null, 0x0
3701
3661
; GFX1264-NEXT: buffer_atomic_sub_u64 v[0:1], off, s[8:11], null th:TH_ATOMIC_RETURN
3702
3662
; GFX1264-NEXT: s_waitcnt vmcnt(0)
3703
3663
; GFX1264-NEXT: buffer_gl0_inv
@@ -3746,8 +3706,6 @@ define amdgpu_kernel void @sub_i64_uniform(ptr addrspace(1) %out, ptr addrspace(
3746
3706
; GFX1232-NEXT: s_mov_b32 s10, -1
3747
3707
; GFX1232-NEXT: s_mov_b32 s8, s6
3748
3708
; GFX1232-NEXT: s_mov_b32 s9, s7
3749
- ; GFX1232-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
3750
- ; GFX1232-NEXT: s_waitcnt_vscnt null, 0x0
3751
3709
; GFX1232-NEXT: buffer_atomic_sub_u64 v[0:1], off, s[8:11], null th:TH_ATOMIC_RETURN
3752
3710
; GFX1232-NEXT: s_waitcnt vmcnt(0)
3753
3711
; GFX1232-NEXT: buffer_gl0_inv
@@ -3869,8 +3827,6 @@ define amdgpu_kernel void @sub_i64_varying(ptr addrspace(1) %out, ptr addrspace(
3869
3827
; GFX12-NEXT: s_mov_b32 s8, s2
3870
3828
; GFX12-NEXT: s_mov_b32 s9, s3
3871
3829
; GFX12-NEXT: s_mov_b32 s4, s0
3872
- ; GFX12-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
3873
- ; GFX12-NEXT: s_waitcnt_vscnt null, 0x0
3874
3830
; GFX12-NEXT: buffer_atomic_sub_u64 v[0:1], off, s[8:11], null th:TH_ATOMIC_RETURN
3875
3831
; GFX12-NEXT: s_waitcnt vmcnt(0)
3876
3832
; GFX12-NEXT: buffer_gl0_inv
0 commit comments