@@ -34,10 +34,9 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
34
34
; GLOBALNESS1-NEXT: s_mov_b64 s[36:37], s[6:7]
35
35
; GLOBALNESS1-NEXT: s_load_dwordx4 s[76:79], s[8:9], 0x0
36
36
; GLOBALNESS1-NEXT: s_load_dword s6, s[8:9], 0x14
37
- ; GLOBALNESS1-NEXT: v_mov_b32_e32 v41, v0
38
37
; GLOBALNESS1-NEXT: v_mov_b32_e32 v42, 0
39
- ; GLOBALNESS1-NEXT: v_pk_mov_b32 v[0:1 ], 0, 0
40
- ; GLOBALNESS1-NEXT: global_store_dword v[0:1 ], v42, off
38
+ ; GLOBALNESS1-NEXT: v_pk_mov_b32 v[44:45 ], 0, 0
39
+ ; GLOBALNESS1-NEXT: global_store_dword v[44:45 ], v42, off
41
40
; GLOBALNESS1-NEXT: s_waitcnt lgkmcnt(0)
42
41
; GLOBALNESS1-NEXT: global_load_dword v2, v42, s[76:77]
43
42
; GLOBALNESS1-NEXT: s_mov_b64 s[40:41], s[4:5]
@@ -46,6 +45,7 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
46
45
; GLOBALNESS1-NEXT: s_add_u32 flat_scratch_lo, s12, s17
47
46
; GLOBALNESS1-NEXT: s_addc_u32 flat_scratch_hi, s13, 0
48
47
; GLOBALNESS1-NEXT: s_add_u32 s0, s0, s17
48
+ ; GLOBALNESS1-NEXT: v_mov_b32_e32 v41, v0
49
49
; GLOBALNESS1-NEXT: v_mov_b32_e32 v0, 0
50
50
; GLOBALNESS1-NEXT: s_addc_u32 s1, s1, 0
51
51
; GLOBALNESS1-NEXT: v_mov_b32_e32 v1, 0x40994400
@@ -73,13 +73,15 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
73
73
; GLOBALNESS1-NEXT: v_cmp_ne_u32_e64 s[52:53], 1, v0
74
74
; GLOBALNESS1-NEXT: v_cmp_ne_u32_e64 s[44:45], 1, v1
75
75
; GLOBALNESS1-NEXT: v_cmp_ne_u32_e64 s[46:47], 1, v3
76
+ ; GLOBALNESS1-NEXT: v_mov_b32_e32 v46, 0x80
76
77
; GLOBALNESS1-NEXT: s_mov_b32 s70, s16
77
78
; GLOBALNESS1-NEXT: s_mov_b64 s[38:39], s[8:9]
78
79
; GLOBALNESS1-NEXT: s_mov_b32 s71, s15
79
80
; GLOBALNESS1-NEXT: s_mov_b32 s72, s14
80
81
; GLOBALNESS1-NEXT: s_mov_b64 s[34:35], s[10:11]
82
+ ; GLOBALNESS1-NEXT: v_mov_b32_e32 v47, 0
81
83
; GLOBALNESS1-NEXT: s_mov_b32 s32, 0
82
- ; GLOBALNESS1-NEXT: ; implicit-def: $vgpr44_vgpr45
84
+ ; GLOBALNESS1-NEXT: ; implicit-def: $vgpr56_vgpr57
83
85
; GLOBALNESS1-NEXT: s_waitcnt vmcnt(0)
84
86
; GLOBALNESS1-NEXT: v_cmp_gt_i32_e32 vcc, 0, v2
85
87
; GLOBALNESS1-NEXT: v_cndmask_b32_e64 v0, 0, 1, vcc
@@ -106,17 +108,15 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
106
108
; GLOBALNESS1-NEXT: .LBB1_3: ; %Flow28
107
109
; GLOBALNESS1-NEXT: ; in Loop: Header=BB1_4 Depth=1
108
110
; GLOBALNESS1-NEXT: s_and_b64 vcc, exec, s[6:7]
109
- ; GLOBALNESS1-NEXT: v_pk_mov_b32 v[44:45 ], v[0:1], v[0:1] op_sel:[0,1]
111
+ ; GLOBALNESS1-NEXT: v_pk_mov_b32 v[56:57 ], v[0:1], v[0:1] op_sel:[0,1]
110
112
; GLOBALNESS1-NEXT: s_cbranch_vccnz .LBB1_30
111
113
; GLOBALNESS1-NEXT: .LBB1_4: ; %bb5
112
114
; GLOBALNESS1-NEXT: ; =>This Loop Header: Depth=1
113
115
; GLOBALNESS1-NEXT: ; Child Loop BB1_16 Depth 2
114
- ; GLOBALNESS1-NEXT: v_mov_b32_e32 v0, 0x80
115
- ; GLOBALNESS1-NEXT: v_mov_b32_e32 v1, 0
116
- ; GLOBALNESS1-NEXT: flat_load_dword v40, v[0:1]
116
+ ; GLOBALNESS1-NEXT: flat_load_dword v40, v[46:47]
117
117
; GLOBALNESS1-NEXT: s_add_u32 s8, s38, 40
118
118
; GLOBALNESS1-NEXT: buffer_store_dword v42, off, s[0:3], 0
119
- ; GLOBALNESS1-NEXT: flat_load_dword v46 , v[0:1 ]
119
+ ; GLOBALNESS1-NEXT: flat_load_dword v58 , v[46:47 ]
120
120
; GLOBALNESS1-NEXT: s_addc_u32 s9, s39, 0
121
121
; GLOBALNESS1-NEXT: s_getpc_b64 s[4:5]
122
122
; GLOBALNESS1-NEXT: s_add_u32 s4, s4, wobble@gotpcrel32@lo+4
@@ -160,8 +160,7 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
160
160
; GLOBALNESS1-NEXT: s_cbranch_vccz .LBB1_24
161
161
; GLOBALNESS1-NEXT: ; %bb.10: ; %baz.exit.i
162
162
; GLOBALNESS1-NEXT: ; in Loop: Header=BB1_4 Depth=1
163
- ; GLOBALNESS1-NEXT: v_pk_mov_b32 v[2:3], 0, 0
164
- ; GLOBALNESS1-NEXT: flat_load_dword v0, v[2:3]
163
+ ; GLOBALNESS1-NEXT: flat_load_dword v0, v[44:45]
165
164
; GLOBALNESS1-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
166
165
; GLOBALNESS1-NEXT: v_cmp_gt_i32_e64 s[62:63], 0, v0
167
166
; GLOBALNESS1-NEXT: v_mov_b32_e32 v0, 0
@@ -170,17 +169,16 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
170
169
; GLOBALNESS1-NEXT: s_cbranch_execz .LBB1_26
171
170
; GLOBALNESS1-NEXT: ; %bb.11: ; %bb33.i
172
171
; GLOBALNESS1-NEXT: ; in Loop: Header=BB1_4 Depth=1
173
- ; GLOBALNESS1-NEXT: global_load_dwordx2 v[0:1], v[2:3 ], off
172
+ ; GLOBALNESS1-NEXT: global_load_dwordx2 v[0:1], v[44:45 ], off
174
173
; GLOBALNESS1-NEXT: s_and_b64 vcc, exec, s[54:55]
175
174
; GLOBALNESS1-NEXT: s_cbranch_vccnz .LBB1_13
176
175
; GLOBALNESS1-NEXT: ; %bb.12: ; %bb39.i
177
176
; GLOBALNESS1-NEXT: ; in Loop: Header=BB1_4 Depth=1
178
177
; GLOBALNESS1-NEXT: v_mov_b32_e32 v43, v42
179
- ; GLOBALNESS1-NEXT: v_pk_mov_b32 v[2:3], 0, 0
180
- ; GLOBALNESS1-NEXT: global_store_dwordx2 v[2:3], v[42:43], off
178
+ ; GLOBALNESS1-NEXT: global_store_dwordx2 v[44:45], v[42:43], off
181
179
; GLOBALNESS1-NEXT: .LBB1_13: ; %bb44.lr.ph.i
182
180
; GLOBALNESS1-NEXT: ; in Loop: Header=BB1_4 Depth=1
183
- ; GLOBALNESS1-NEXT: v_cmp_ne_u32_e32 vcc, 0, v46
181
+ ; GLOBALNESS1-NEXT: v_cmp_ne_u32_e32 vcc, 0, v58
184
182
; GLOBALNESS1-NEXT: v_cndmask_b32_e32 v2, 0, v40, vcc
185
183
; GLOBALNESS1-NEXT: s_waitcnt vmcnt(0)
186
184
; GLOBALNESS1-NEXT: v_cmp_nlt_f64_e32 vcc, 0, v[0:1]
@@ -237,7 +235,6 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
237
235
; GLOBALNESS1-NEXT: v_mov_b32_e32 v31, v41
238
236
; GLOBALNESS1-NEXT: s_waitcnt lgkmcnt(0)
239
237
; GLOBALNESS1-NEXT: s_swappc_b64 s[30:31], s[76:77]
240
- ; GLOBALNESS1-NEXT: v_pk_mov_b32 v[46:47], 0, 0
241
238
; GLOBALNESS1-NEXT: s_mov_b64 s[4:5], s[40:41]
242
239
; GLOBALNESS1-NEXT: s_mov_b64 s[6:7], s[36:37]
243
240
; GLOBALNESS1-NEXT: s_mov_b64 s[8:9], s[68:69]
@@ -246,14 +243,14 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
246
243
; GLOBALNESS1-NEXT: s_mov_b32 s13, s71
247
244
; GLOBALNESS1-NEXT: s_mov_b32 s14, s70
248
245
; GLOBALNESS1-NEXT: v_mov_b32_e32 v31, v41
249
- ; GLOBALNESS1-NEXT: global_store_dwordx2 v[46:47 ], v[44:45 ], off
246
+ ; GLOBALNESS1-NEXT: global_store_dwordx2 v[44:45 ], v[56:57 ], off
250
247
; GLOBALNESS1-NEXT: s_swappc_b64 s[30:31], s[76:77]
251
248
; GLOBALNESS1-NEXT: s_and_saveexec_b64 s[4:5], s[64:65]
252
249
; GLOBALNESS1-NEXT: s_cbranch_execz .LBB1_14
253
250
; GLOBALNESS1-NEXT: ; %bb.23: ; %bb62.i
254
251
; GLOBALNESS1-NEXT: ; in Loop: Header=BB1_16 Depth=2
255
252
; GLOBALNESS1-NEXT: v_mov_b32_e32 v43, v42
256
- ; GLOBALNESS1-NEXT: global_store_dwordx2 v[46:47 ], v[42:43], off
253
+ ; GLOBALNESS1-NEXT: global_store_dwordx2 v[44:45 ], v[42:43], off
257
254
; GLOBALNESS1-NEXT: s_branch .LBB1_14
258
255
; GLOBALNESS1-NEXT: .LBB1_24: ; in Loop: Header=BB1_4 Depth=1
259
256
; GLOBALNESS1-NEXT: s_mov_b64 s[6:7], -1
@@ -274,14 +271,12 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
274
271
; GLOBALNESS1-NEXT: ; %bb.28: ; %bb69.i
275
272
; GLOBALNESS1-NEXT: ; in Loop: Header=BB1_4 Depth=1
276
273
; GLOBALNESS1-NEXT: v_mov_b32_e32 v43, v42
277
- ; GLOBALNESS1-NEXT: v_pk_mov_b32 v[2:3], 0, 0
278
- ; GLOBALNESS1-NEXT: global_store_dwordx2 v[2:3], v[42:43], off
274
+ ; GLOBALNESS1-NEXT: global_store_dwordx2 v[44:45], v[42:43], off
279
275
; GLOBALNESS1-NEXT: s_branch .LBB1_1
280
276
; GLOBALNESS1-NEXT: .LBB1_29: ; %bb73.i
281
277
; GLOBALNESS1-NEXT: ; in Loop: Header=BB1_4 Depth=1
282
278
; GLOBALNESS1-NEXT: v_mov_b32_e32 v43, v42
283
- ; GLOBALNESS1-NEXT: v_pk_mov_b32 v[2:3], 0, 0
284
- ; GLOBALNESS1-NEXT: global_store_dwordx2 v[2:3], v[42:43], off
279
+ ; GLOBALNESS1-NEXT: global_store_dwordx2 v[44:45], v[42:43], off
285
280
; GLOBALNESS1-NEXT: s_branch .LBB1_2
286
281
; GLOBALNESS1-NEXT: .LBB1_30: ; %loop.exit.guard
287
282
; GLOBALNESS1-NEXT: s_andn2_b64 vcc, exec, s[4:5]
@@ -326,10 +321,9 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
326
321
; GLOBALNESS0-NEXT: s_mov_b64 s[36:37], s[6:7]
327
322
; GLOBALNESS0-NEXT: s_load_dwordx4 s[72:75], s[8:9], 0x0
328
323
; GLOBALNESS0-NEXT: s_load_dword s6, s[8:9], 0x14
329
- ; GLOBALNESS0-NEXT: v_mov_b32_e32 v41, v0
330
324
; GLOBALNESS0-NEXT: v_mov_b32_e32 v42, 0
331
- ; GLOBALNESS0-NEXT: v_pk_mov_b32 v[0:1 ], 0, 0
332
- ; GLOBALNESS0-NEXT: global_store_dword v[0:1 ], v42, off
325
+ ; GLOBALNESS0-NEXT: v_pk_mov_b32 v[44:45 ], 0, 0
326
+ ; GLOBALNESS0-NEXT: global_store_dword v[44:45 ], v42, off
333
327
; GLOBALNESS0-NEXT: s_waitcnt lgkmcnt(0)
334
328
; GLOBALNESS0-NEXT: global_load_dword v2, v42, s[72:73]
335
329
; GLOBALNESS0-NEXT: s_mov_b64 s[40:41], s[4:5]
@@ -338,6 +332,7 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
338
332
; GLOBALNESS0-NEXT: s_add_u32 flat_scratch_lo, s12, s17
339
333
; GLOBALNESS0-NEXT: s_addc_u32 flat_scratch_hi, s13, 0
340
334
; GLOBALNESS0-NEXT: s_add_u32 s0, s0, s17
335
+ ; GLOBALNESS0-NEXT: v_mov_b32_e32 v41, v0
341
336
; GLOBALNESS0-NEXT: v_mov_b32_e32 v0, 0
342
337
; GLOBALNESS0-NEXT: s_addc_u32 s1, s1, 0
343
338
; GLOBALNESS0-NEXT: v_mov_b32_e32 v1, 0x40994400
@@ -365,13 +360,15 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
365
360
; GLOBALNESS0-NEXT: v_cmp_ne_u32_e64 s[52:53], 1, v0
366
361
; GLOBALNESS0-NEXT: v_cmp_ne_u32_e64 s[44:45], 1, v1
367
362
; GLOBALNESS0-NEXT: v_cmp_ne_u32_e64 s[46:47], 1, v3
363
+ ; GLOBALNESS0-NEXT: v_mov_b32_e32 v46, 0x80
368
364
; GLOBALNESS0-NEXT: s_mov_b32 s68, s16
369
365
; GLOBALNESS0-NEXT: s_mov_b64 s[38:39], s[8:9]
370
366
; GLOBALNESS0-NEXT: s_mov_b32 s69, s15
371
367
; GLOBALNESS0-NEXT: s_mov_b32 s70, s14
372
368
; GLOBALNESS0-NEXT: s_mov_b64 s[34:35], s[10:11]
369
+ ; GLOBALNESS0-NEXT: v_mov_b32_e32 v47, 0
373
370
; GLOBALNESS0-NEXT: s_mov_b32 s32, 0
374
- ; GLOBALNESS0-NEXT: ; implicit-def: $vgpr44_vgpr45
371
+ ; GLOBALNESS0-NEXT: ; implicit-def: $vgpr56_vgpr57
375
372
; GLOBALNESS0-NEXT: s_waitcnt vmcnt(0)
376
373
; GLOBALNESS0-NEXT: v_cmp_gt_i32_e32 vcc, 0, v2
377
374
; GLOBALNESS0-NEXT: v_cndmask_b32_e64 v0, 0, 1, vcc
@@ -398,17 +395,15 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
398
395
; GLOBALNESS0-NEXT: .LBB1_3: ; %Flow28
399
396
; GLOBALNESS0-NEXT: ; in Loop: Header=BB1_4 Depth=1
400
397
; GLOBALNESS0-NEXT: s_and_b64 vcc, exec, s[6:7]
401
- ; GLOBALNESS0-NEXT: v_pk_mov_b32 v[44:45 ], v[0:1], v[0:1] op_sel:[0,1]
398
+ ; GLOBALNESS0-NEXT: v_pk_mov_b32 v[56:57 ], v[0:1], v[0:1] op_sel:[0,1]
402
399
; GLOBALNESS0-NEXT: s_cbranch_vccnz .LBB1_30
403
400
; GLOBALNESS0-NEXT: .LBB1_4: ; %bb5
404
401
; GLOBALNESS0-NEXT: ; =>This Loop Header: Depth=1
405
402
; GLOBALNESS0-NEXT: ; Child Loop BB1_16 Depth 2
406
- ; GLOBALNESS0-NEXT: v_mov_b32_e32 v0, 0x80
407
- ; GLOBALNESS0-NEXT: v_mov_b32_e32 v1, 0
408
- ; GLOBALNESS0-NEXT: flat_load_dword v40, v[0:1]
403
+ ; GLOBALNESS0-NEXT: flat_load_dword v40, v[46:47]
409
404
; GLOBALNESS0-NEXT: s_add_u32 s8, s38, 40
410
405
; GLOBALNESS0-NEXT: buffer_store_dword v42, off, s[0:3], 0
411
- ; GLOBALNESS0-NEXT: flat_load_dword v46 , v[0:1 ]
406
+ ; GLOBALNESS0-NEXT: flat_load_dword v58 , v[46:47 ]
412
407
; GLOBALNESS0-NEXT: s_addc_u32 s9, s39, 0
413
408
; GLOBALNESS0-NEXT: s_getpc_b64 s[4:5]
414
409
; GLOBALNESS0-NEXT: s_add_u32 s4, s4, wobble@gotpcrel32@lo+4
@@ -452,8 +447,7 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
452
447
; GLOBALNESS0-NEXT: s_cbranch_vccz .LBB1_24
453
448
; GLOBALNESS0-NEXT: ; %bb.10: ; %baz.exit.i
454
449
; GLOBALNESS0-NEXT: ; in Loop: Header=BB1_4 Depth=1
455
- ; GLOBALNESS0-NEXT: v_pk_mov_b32 v[2:3], 0, 0
456
- ; GLOBALNESS0-NEXT: flat_load_dword v0, v[2:3]
450
+ ; GLOBALNESS0-NEXT: flat_load_dword v0, v[44:45]
457
451
; GLOBALNESS0-NEXT: s_waitcnt vmcnt(0) lgkmcnt(0)
458
452
; GLOBALNESS0-NEXT: v_cmp_gt_i32_e64 s[62:63], 0, v0
459
453
; GLOBALNESS0-NEXT: v_mov_b32_e32 v0, 0
@@ -462,17 +456,16 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
462
456
; GLOBALNESS0-NEXT: s_cbranch_execz .LBB1_26
463
457
; GLOBALNESS0-NEXT: ; %bb.11: ; %bb33.i
464
458
; GLOBALNESS0-NEXT: ; in Loop: Header=BB1_4 Depth=1
465
- ; GLOBALNESS0-NEXT: global_load_dwordx2 v[0:1], v[2:3 ], off
459
+ ; GLOBALNESS0-NEXT: global_load_dwordx2 v[0:1], v[44:45 ], off
466
460
; GLOBALNESS0-NEXT: s_and_b64 vcc, exec, s[54:55]
467
461
; GLOBALNESS0-NEXT: s_cbranch_vccnz .LBB1_13
468
462
; GLOBALNESS0-NEXT: ; %bb.12: ; %bb39.i
469
463
; GLOBALNESS0-NEXT: ; in Loop: Header=BB1_4 Depth=1
470
464
; GLOBALNESS0-NEXT: v_mov_b32_e32 v43, v42
471
- ; GLOBALNESS0-NEXT: v_pk_mov_b32 v[2:3], 0, 0
472
- ; GLOBALNESS0-NEXT: global_store_dwordx2 v[2:3], v[42:43], off
465
+ ; GLOBALNESS0-NEXT: global_store_dwordx2 v[44:45], v[42:43], off
473
466
; GLOBALNESS0-NEXT: .LBB1_13: ; %bb44.lr.ph.i
474
467
; GLOBALNESS0-NEXT: ; in Loop: Header=BB1_4 Depth=1
475
- ; GLOBALNESS0-NEXT: v_cmp_ne_u32_e32 vcc, 0, v46
468
+ ; GLOBALNESS0-NEXT: v_cmp_ne_u32_e32 vcc, 0, v58
476
469
; GLOBALNESS0-NEXT: v_cndmask_b32_e32 v2, 0, v40, vcc
477
470
; GLOBALNESS0-NEXT: s_waitcnt vmcnt(0)
478
471
; GLOBALNESS0-NEXT: v_cmp_nlt_f64_e32 vcc, 0, v[0:1]
@@ -529,7 +522,6 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
529
522
; GLOBALNESS0-NEXT: v_mov_b32_e32 v31, v41
530
523
; GLOBALNESS0-NEXT: s_waitcnt lgkmcnt(0)
531
524
; GLOBALNESS0-NEXT: s_swappc_b64 s[30:31], s[78:79]
532
- ; GLOBALNESS0-NEXT: v_pk_mov_b32 v[46:47], 0, 0
533
525
; GLOBALNESS0-NEXT: s_mov_b64 s[4:5], s[40:41]
534
526
; GLOBALNESS0-NEXT: s_mov_b64 s[6:7], s[36:37]
535
527
; GLOBALNESS0-NEXT: s_mov_b64 s[8:9], s[72:73]
@@ -538,14 +530,14 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
538
530
; GLOBALNESS0-NEXT: s_mov_b32 s13, s69
539
531
; GLOBALNESS0-NEXT: s_mov_b32 s14, s68
540
532
; GLOBALNESS0-NEXT: v_mov_b32_e32 v31, v41
541
- ; GLOBALNESS0-NEXT: global_store_dwordx2 v[46:47 ], v[44:45 ], off
533
+ ; GLOBALNESS0-NEXT: global_store_dwordx2 v[44:45 ], v[56:57 ], off
542
534
; GLOBALNESS0-NEXT: s_swappc_b64 s[30:31], s[78:79]
543
535
; GLOBALNESS0-NEXT: s_and_saveexec_b64 s[4:5], s[64:65]
544
536
; GLOBALNESS0-NEXT: s_cbranch_execz .LBB1_14
545
537
; GLOBALNESS0-NEXT: ; %bb.23: ; %bb62.i
546
538
; GLOBALNESS0-NEXT: ; in Loop: Header=BB1_16 Depth=2
547
539
; GLOBALNESS0-NEXT: v_mov_b32_e32 v43, v42
548
- ; GLOBALNESS0-NEXT: global_store_dwordx2 v[46:47 ], v[42:43], off
540
+ ; GLOBALNESS0-NEXT: global_store_dwordx2 v[44:45 ], v[42:43], off
549
541
; GLOBALNESS0-NEXT: s_branch .LBB1_14
550
542
; GLOBALNESS0-NEXT: .LBB1_24: ; in Loop: Header=BB1_4 Depth=1
551
543
; GLOBALNESS0-NEXT: s_mov_b64 s[6:7], -1
@@ -566,14 +558,12 @@ define amdgpu_kernel void @kernel(ptr addrspace(1) %arg1.global, i1 %tmp3.i.i, i
566
558
; GLOBALNESS0-NEXT: ; %bb.28: ; %bb69.i
567
559
; GLOBALNESS0-NEXT: ; in Loop: Header=BB1_4 Depth=1
568
560
; GLOBALNESS0-NEXT: v_mov_b32_e32 v43, v42
569
- ; GLOBALNESS0-NEXT: v_pk_mov_b32 v[2:3], 0, 0
570
- ; GLOBALNESS0-NEXT: global_store_dwordx2 v[2:3], v[42:43], off
561
+ ; GLOBALNESS0-NEXT: global_store_dwordx2 v[44:45], v[42:43], off
571
562
; GLOBALNESS0-NEXT: s_branch .LBB1_1
572
563
; GLOBALNESS0-NEXT: .LBB1_29: ; %bb73.i
573
564
; GLOBALNESS0-NEXT: ; in Loop: Header=BB1_4 Depth=1
574
565
; GLOBALNESS0-NEXT: v_mov_b32_e32 v43, v42
575
- ; GLOBALNESS0-NEXT: v_pk_mov_b32 v[2:3], 0, 0
576
- ; GLOBALNESS0-NEXT: global_store_dwordx2 v[2:3], v[42:43], off
566
+ ; GLOBALNESS0-NEXT: global_store_dwordx2 v[44:45], v[42:43], off
577
567
; GLOBALNESS0-NEXT: s_branch .LBB1_2
578
568
; GLOBALNESS0-NEXT: .LBB1_30: ; %loop.exit.guard
579
569
; GLOBALNESS0-NEXT: s_andn2_b64 vcc, exec, s[4:5]
0 commit comments