@@ -147,7 +147,7 @@ define amdgpu_ps void @global_atomic_fadd_f32_no_rtn_atomicrmw(ptr addrspace(1)
147
147
define amdgpu_ps void @global_atomic_fadd_f32_saddr_no_rtn_atomicrmw (ptr addrspace (1 ) inreg %ptr , float %data ) #0 {
148
148
; GFX90A_GFX940-LABEL: name: global_atomic_fadd_f32_saddr_no_rtn_atomicrmw
149
149
; GFX90A_GFX940: bb.0 (%ir-block.0):
150
- ; GFX90A_GFX940-NEXT: successors: %bb.1(0x40000000), %bb.3 (0x40000000)
150
+ ; GFX90A_GFX940-NEXT: successors: %bb.1(0x40000000), %bb.4 (0x40000000)
151
151
; GFX90A_GFX940-NEXT: liveins: $sgpr0, $sgpr1, $vgpr0
152
152
; GFX90A_GFX940-NEXT: {{ $}}
153
153
; GFX90A_GFX940-NEXT: [[PRED_COPY:%[0-9]+]]:vgpr_32 = PRED_COPY $vgpr0
@@ -156,11 +156,11 @@ define amdgpu_ps void @global_atomic_fadd_f32_saddr_no_rtn_atomicrmw(ptr addrspa
156
156
; GFX90A_GFX940-NEXT: [[REG_SEQUENCE:%[0-9]+]]:sgpr_64 = REG_SEQUENCE [[PRED_COPY2]], %subreg.sub0, [[PRED_COPY1]], %subreg.sub1
157
157
; GFX90A_GFX940-NEXT: [[PRED_COPY3:%[0-9]+]]:sreg_64 = PRED_COPY [[REG_SEQUENCE]]
158
158
; GFX90A_GFX940-NEXT: [[SI_PS_LIVE:%[0-9]+]]:sreg_64 = SI_PS_LIVE
159
- ; GFX90A_GFX940-NEXT: [[SI_IF:%[0-9]+]]:sreg_64 = SI_IF killed [[SI_PS_LIVE]], %bb.3 , implicit-def dead $exec, implicit-def dead $scc, implicit $exec
159
+ ; GFX90A_GFX940-NEXT: [[SI_IF:%[0-9]+]]:sreg_64 = SI_IF killed [[SI_PS_LIVE]], %bb.4 , implicit-def dead $exec, implicit-def dead $scc, implicit $exec
160
160
; GFX90A_GFX940-NEXT: S_BRANCH %bb.1
161
161
; GFX90A_GFX940-NEXT: {{ $}}
162
162
; GFX90A_GFX940-NEXT: bb.1 (%ir-block.5):
163
- ; GFX90A_GFX940-NEXT: successors: %bb.2(0x40000000), %bb.4 (0x40000000)
163
+ ; GFX90A_GFX940-NEXT: successors: %bb.2(0x40000000), %bb.3 (0x40000000)
164
164
; GFX90A_GFX940-NEXT: {{ $}}
165
165
; GFX90A_GFX940-NEXT: [[PRED_COPY4:%[0-9]+]]:sreg_64 = PRED_COPY $exec
166
166
; GFX90A_GFX940-NEXT: [[PRED_COPY5:%[0-9]+]]:sreg_32 = PRED_COPY [[PRED_COPY4]].sub1
@@ -188,30 +188,23 @@ define amdgpu_ps void @global_atomic_fadd_f32_saddr_no_rtn_atomicrmw(ptr addrspa
188
188
; GFX90A_GFX940-NEXT: [[V_READLANE_B32_:%[0-9]+]]:sreg_32 = V_READLANE_B32 killed [[V_ADD_F32_e64_5]], killed [[S_MOV_B32_2]]
189
189
; GFX90A_GFX940-NEXT: early-clobber %1:sgpr_32 = STRICT_WWM killed [[V_READLANE_B32_]], implicit $exec
190
190
; GFX90A_GFX940-NEXT: [[V_CMP_EQ_U32_e64_:%[0-9]+]]:sreg_64 = V_CMP_EQ_U32_e64 killed [[V_MBCNT_HI_U32_B32_e64_]], [[S_MOV_B32_]], implicit $exec
191
- ; GFX90A_GFX940-NEXT: [[SI_IF1:%[0-9]+]]:sreg_64 = SI_IF killed [[V_CMP_EQ_U32_e64_]], %bb.4 , implicit-def dead $exec, implicit-def dead $scc, implicit $exec
191
+ ; GFX90A_GFX940-NEXT: [[SI_IF1:%[0-9]+]]:sreg_64 = SI_IF killed [[V_CMP_EQ_U32_e64_]], %bb.3 , implicit-def dead $exec, implicit-def dead $scc, implicit $exec
192
192
; GFX90A_GFX940-NEXT: S_BRANCH %bb.2
193
193
; GFX90A_GFX940-NEXT: {{ $}}
194
- ; GFX90A_GFX940-NEXT: bb.2 (%ir-block.36 ):
195
- ; GFX90A_GFX940-NEXT: successors: %bb.4 (0x80000000)
194
+ ; GFX90A_GFX940-NEXT: bb.2 (%ir-block.35 ):
195
+ ; GFX90A_GFX940-NEXT: successors: %bb.3 (0x80000000)
196
196
; GFX90A_GFX940-NEXT: {{ $}}
197
197
; GFX90A_GFX940-NEXT: [[V_MOV_B32_e32_1:%[0-9]+]]:vgpr_32 = V_MOV_B32_e32 0, implicit $exec
198
198
; GFX90A_GFX940-NEXT: [[PRED_COPY8:%[0-9]+]]:vgpr_32 = PRED_COPY %1
199
199
; GFX90A_GFX940-NEXT: GLOBAL_ATOMIC_ADD_F32_SADDR killed [[V_MOV_B32_e32_1]], [[PRED_COPY8]], [[PRED_COPY3]], 0, 0, implicit $exec :: (load store syncscope("wavefront") monotonic (s32) on %ir.ptr, addrspace 1)
200
- ; GFX90A_GFX940-NEXT: S_BRANCH %bb.4
201
200
; GFX90A_GFX940-NEXT: {{ $}}
202
201
; GFX90A_GFX940-NEXT: bb.3.Flow:
203
- ; GFX90A_GFX940-NEXT: successors: %bb.5(0x80000000)
204
- ; GFX90A_GFX940-NEXT: {{ $}}
205
- ; GFX90A_GFX940-NEXT: SI_END_CF [[SI_IF]], implicit-def dead $exec, implicit-def dead $scc, implicit $exec
206
- ; GFX90A_GFX940-NEXT: S_BRANCH %bb.5
207
- ; GFX90A_GFX940-NEXT: {{ $}}
208
- ; GFX90A_GFX940-NEXT: bb.4 (%ir-block.38):
209
- ; GFX90A_GFX940-NEXT: successors: %bb.3(0x80000000)
202
+ ; GFX90A_GFX940-NEXT: successors: %bb.4(0x80000000)
210
203
; GFX90A_GFX940-NEXT: {{ $}}
211
204
; GFX90A_GFX940-NEXT: SI_END_CF [[SI_IF1]], implicit-def dead $exec, implicit-def dead $scc, implicit $exec
212
- ; GFX90A_GFX940-NEXT: S_BRANCH %bb.3
213
205
; GFX90A_GFX940-NEXT: {{ $}}
214
- ; GFX90A_GFX940-NEXT: bb.5 (%ir-block.39):
206
+ ; GFX90A_GFX940-NEXT: bb.4 (%ir-block.37):
207
+ ; GFX90A_GFX940-NEXT: SI_END_CF [[SI_IF]], implicit-def dead $exec, implicit-def dead $scc, implicit $exec
215
208
; GFX90A_GFX940-NEXT: S_ENDPGM 0
216
209
%ret = atomicrmw fadd ptr addrspace (1 ) %ptr , float %data syncscope("wavefront" ) monotonic
217
210
ret void
0 commit comments