@@ -30,19 +30,19 @@ define amdgpu_cs void @max_6_vgprs(ptr addrspace(1) %p) "amdgpu-num-vgpr"="6" {
30
30
; CHECK-NEXT: ;;#ASMEND
31
31
; CHECK-NEXT: global_store_b32 v[0:1], v5, off th:TH_STORE_NT_RT
32
32
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
33
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:4 ; 4-byte Folded Reload
33
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:4 th:TH_LOAD_LU ; 4-byte Folded Reload
34
34
; CHECK-NEXT: s_waitcnt vmcnt(0)
35
35
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
36
36
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
37
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:8 ; 4-byte Folded Reload
37
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:8 th:TH_LOAD_LU ; 4-byte Folded Reload
38
38
; CHECK-NEXT: s_waitcnt vmcnt(0)
39
39
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
40
40
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
41
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:12 ; 4-byte Folded Reload
41
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:12 th:TH_LOAD_LU ; 4-byte Folded Reload
42
42
; CHECK-NEXT: s_waitcnt vmcnt(0)
43
43
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
44
44
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
45
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:16 ; 4-byte Folded Reload
45
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:16 th:TH_LOAD_LU ; 4-byte Folded Reload
46
46
; CHECK-NEXT: s_waitcnt vmcnt(0)
47
47
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
48
48
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
@@ -118,31 +118,31 @@ define amdgpu_cs void @max_11_vgprs_branch(ptr addrspace(1) %p, i32 %tmp) "amdgp
118
118
; CHECK-NEXT: ;;#ASMEND
119
119
; CHECK-NEXT: global_store_b32 v[0:1], v10, off th:TH_STORE_NT_RT
120
120
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
121
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:20 ; 4-byte Folded Reload
121
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:20 th:TH_LOAD_LU ; 4-byte Folded Reload
122
122
; CHECK-NEXT: s_waitcnt vmcnt(0)
123
123
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
124
124
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
125
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:24 ; 4-byte Folded Reload
125
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:24 th:TH_LOAD_LU ; 4-byte Folded Reload
126
126
; CHECK-NEXT: s_waitcnt vmcnt(0)
127
127
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
128
128
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
129
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:28 ; 4-byte Folded Reload
129
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:28 th:TH_LOAD_LU ; 4-byte Folded Reload
130
130
; CHECK-NEXT: s_waitcnt vmcnt(0)
131
131
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
132
132
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
133
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:32 ; 4-byte Folded Reload
133
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:32 th:TH_LOAD_LU ; 4-byte Folded Reload
134
134
; CHECK-NEXT: s_waitcnt vmcnt(0)
135
135
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
136
136
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
137
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:36 ; 4-byte Folded Reload
137
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:36 th:TH_LOAD_LU ; 4-byte Folded Reload
138
138
; CHECK-NEXT: s_waitcnt vmcnt(0)
139
139
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
140
140
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
141
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:12 ; 4-byte Folded Reload
141
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:12 th:TH_LOAD_LU ; 4-byte Folded Reload
142
142
; CHECK-NEXT: s_waitcnt vmcnt(0)
143
143
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
144
144
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
145
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:16 ; 4-byte Folded Reload
145
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:16 th:TH_LOAD_LU ; 4-byte Folded Reload
146
146
; CHECK-NEXT: s_waitcnt vmcnt(0)
147
147
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
148
148
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
@@ -176,41 +176,41 @@ define amdgpu_cs void @max_11_vgprs_branch(ptr addrspace(1) %p, i32 %tmp) "amdgp
176
176
; CHECK-NEXT: ;;#ASMEND
177
177
; CHECK-NEXT: global_store_b32 v[0:1], v10, off th:TH_STORE_NT_RT
178
178
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
179
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:20 ; 4-byte Folded Reload
179
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:20 th:TH_LOAD_LU ; 4-byte Folded Reload
180
180
; CHECK-NEXT: s_waitcnt vmcnt(0)
181
181
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
182
182
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
183
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:24 ; 4-byte Folded Reload
183
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:24 th:TH_LOAD_LU ; 4-byte Folded Reload
184
184
; CHECK-NEXT: s_waitcnt vmcnt(0)
185
185
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
186
186
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
187
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:28 ; 4-byte Folded Reload
187
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:28 th:TH_LOAD_LU ; 4-byte Folded Reload
188
188
; CHECK-NEXT: s_waitcnt vmcnt(0)
189
189
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
190
190
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
191
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:32 ; 4-byte Folded Reload
191
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:32 th:TH_LOAD_LU ; 4-byte Folded Reload
192
192
; CHECK-NEXT: s_waitcnt vmcnt(0)
193
193
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
194
194
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
195
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:36 ; 4-byte Folded Reload
195
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:36 th:TH_LOAD_LU ; 4-byte Folded Reload
196
196
; CHECK-NEXT: s_waitcnt vmcnt(0)
197
197
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
198
198
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
199
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:12 ; 4-byte Folded Reload
199
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:12 th:TH_LOAD_LU ; 4-byte Folded Reload
200
200
; CHECK-NEXT: s_waitcnt vmcnt(0)
201
201
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
202
202
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
203
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:16 ; 4-byte Folded Reload
203
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:16 th:TH_LOAD_LU ; 4-byte Folded Reload
204
204
; CHECK-NEXT: s_waitcnt vmcnt(0)
205
205
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
206
206
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
207
207
; CHECK-NEXT: .LBB1_4: ; %.exit
208
208
; CHECK-NEXT: s_or_b32 exec_lo, exec_lo, s0
209
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:4 ; 4-byte Folded Reload
209
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:4 th:TH_LOAD_LU ; 4-byte Folded Reload
210
210
; CHECK-NEXT: s_waitcnt vmcnt(0)
211
211
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
212
212
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
213
- ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:8 ; 4-byte Folded Reload
213
+ ; CHECK-NEXT: scratch_load_b32 v0, off, off offset:8 th:TH_LOAD_LU ; 4-byte Folded Reload
214
214
; CHECK-NEXT: s_waitcnt vmcnt(0)
215
215
; CHECK-NEXT: global_store_b32 v[0:1], v0, off th:TH_STORE_NT_RT
216
216
; CHECK-NEXT: s_waitcnt_vscnt null, 0x0
0 commit comments