Skip to content

Commit 6882125

Browse files
committed
[SDag] Notify listeners when deleting a node
SelectionDAG::DeleteNode does not notify listeners about node deletion. As a result, SelectionDAG::Legalize may skip legalization of some nodes, resulting in a "Legalized selection DAG" that still contains illegal nodes. These nodes will be legalized during the subsequent DAG combining phase, but this may be too late for some patterns to match.
1 parent bb17651 commit 6882125

15 files changed

+1302
-1260
lines changed

llvm/lib/CodeGen/SelectionDAG/SelectionDAG.cpp

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1087,6 +1087,9 @@ void SelectionDAG::RemoveDeadNode(SDNode *N){
10871087
}
10881088

10891089
void SelectionDAG::DeleteNode(SDNode *N) {
1090+
for (DAGUpdateListener *DUL = UpdateListeners; DUL; DUL = DUL->Next)
1091+
DUL->NodeDeleted(N, nullptr);
1092+
10901093
// First take this out of the appropriate CSE map.
10911094
RemoveNodeFromCSEMaps(N);
10921095

llvm/test/CodeGen/AMDGPU/half.ll

Lines changed: 73 additions & 73 deletions
Original file line number | Diff line number | Diff line change
@@ -2317,7 +2317,7 @@ define amdgpu_kernel void @global_extload_v16f16_to_v16f64(ptr addrspace(1) %out
23172317
; VI-NEXT: s_addc_u32 s3, s1, 0
23182318
; VI-NEXT: v_mov_b32_e32 v18, s3
23192319
; VI-NEXT: v_mov_b32_e32 v17, s2
2320-
; VI-NEXT: s_add_u32 s2, s0, 0x50
2320+
; VI-NEXT: s_add_u32 s2, s0, 0x70
23212321
; VI-NEXT: v_mov_b32_e32 v12, s1
23222322
; VI-NEXT: s_addc_u32 s3, s1, 0
23232323
; VI-NEXT: v_mov_b32_e32 v11, s0
@@ -2331,12 +2331,12 @@ define amdgpu_kernel void @global_extload_v16f16_to_v16f64(ptr addrspace(1) %out
23312331
; VI-NEXT: v_cvt_f32_f16_e32 v7, v6
23322332
; VI-NEXT: v_cvt_f32_f16_sdwa v8, v6 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1
23332333
; VI-NEXT: s_waitcnt vmcnt(1)
2334-
; VI-NEXT: v_cvt_f32_f16_e32 v10, v2
2334+
; VI-NEXT: v_cvt_f32_f16_e32 v10, v0
23352335
; VI-NEXT: v_mov_b32_e32 v14, s3
23362336
; VI-NEXT: v_cvt_f64_f32_e32 v[6:7], v7
23372337
; VI-NEXT: v_cvt_f64_f32_e32 v[8:9], v8
23382338
; VI-NEXT: v_mov_b32_e32 v13, s2
2339-
; VI-NEXT: s_add_u32 s2, s0, 64
2339+
; VI-NEXT: s_add_u32 s2, s0, 0x60
23402340
; VI-NEXT: s_addc_u32 s3, s1, 0
23412341
; VI-NEXT: flat_store_dwordx4 v[15:16], v[6:9]
23422342
; VI-NEXT: v_mov_b32_e32 v16, s3
@@ -2347,37 +2347,37 @@ define amdgpu_kernel void @global_extload_v16f16_to_v16f64(ptr addrspace(1) %out
23472347
; VI-NEXT: v_cvt_f64_f32_e32 v[4:5], v6
23482348
; VI-NEXT: v_cvt_f64_f32_e32 v[6:7], v7
23492349
; VI-NEXT: v_mov_b32_e32 v15, s2
2350-
; VI-NEXT: s_add_u32 s2, s0, 0x70
2350+
; VI-NEXT: s_add_u32 s2, s0, 0x50
23512351
; VI-NEXT: s_addc_u32 s3, s1, 0
23522352
; VI-NEXT: flat_store_dwordx4 v[17:18], v[4:7]
2353-
; VI-NEXT: v_cvt_f32_f16_sdwa v17, v3 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1
2353+
; VI-NEXT: v_cvt_f32_f16_sdwa v17, v0 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1
23542354
; VI-NEXT: v_cvt_f64_f32_e32 v[4:5], v8
23552355
; VI-NEXT: v_cvt_f64_f32_e32 v[6:7], v9
2356-
; VI-NEXT: v_cvt_f32_f16_sdwa v9, v1 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1
2357-
; VI-NEXT: v_cvt_f32_f16_sdwa v8, v2 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1
2358-
; VI-NEXT: v_cvt_f32_f16_e32 v2, v1
2356+
; VI-NEXT: v_cvt_f32_f16_sdwa v8, v3 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1
2357+
; VI-NEXT: v_cvt_f32_f16_e32 v0, v3
2358+
; VI-NEXT: s_add_u32 s0, s0, 64
23592359
; VI-NEXT: flat_store_dwordx4 v[11:12], v[4:7]
2360-
; VI-NEXT: v_cvt_f32_f16_sdwa v11, v0 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1
2361-
; VI-NEXT: v_cvt_f32_f16_e32 v7, v3
2362-
; VI-NEXT: v_cvt_f64_f32_e32 v[3:4], v9
2363-
; VI-NEXT: v_cvt_f32_f16_e32 v9, v0
2364-
; VI-NEXT: v_cvt_f64_f32_e32 v[1:2], v2
2365-
; VI-NEXT: v_cvt_f64_f32_e32 v[5:6], v10
2366-
; VI-NEXT: v_cvt_f64_f32_e32 v[11:12], v11
2367-
; VI-NEXT: v_cvt_f64_f32_e32 v[9:10], v9
2368-
; VI-NEXT: s_add_u32 s0, s0, 0x60
2369-
; VI-NEXT: flat_store_dwordx4 v[13:14], v[1:4]
2360+
; VI-NEXT: v_cvt_f32_f16_sdwa v12, v1 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1
2361+
; VI-NEXT: v_cvt_f64_f32_e32 v[5:6], v8
2362+
; VI-NEXT: v_cvt_f32_f16_e32 v8, v2
2363+
; VI-NEXT: v_cvt_f32_f16_sdwa v2, v2 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1
2364+
; VI-NEXT: v_cvt_f32_f16_e32 v7, v1
2365+
; VI-NEXT: v_cvt_f64_f32_e32 v[3:4], v0
2366+
; VI-NEXT: v_cvt_f64_f32_e32 v[0:1], v10
2367+
; VI-NEXT: v_cvt_f64_f32_e32 v[8:9], v8
2368+
; VI-NEXT: v_cvt_f64_f32_e32 v[10:11], v2
2369+
; VI-NEXT: flat_store_dwordx4 v[13:14], v[3:6]
23702370
; VI-NEXT: s_addc_u32 s1, s1, 0
2371-
; VI-NEXT: v_cvt_f64_f32_e32 v[0:1], v7
2371+
; VI-NEXT: v_cvt_f64_f32_e32 v[4:5], v7
2372+
; VI-NEXT: v_cvt_f64_f32_e32 v[6:7], v12
23722373
; VI-NEXT: v_cvt_f64_f32_e32 v[2:3], v17
2373-
; VI-NEXT: v_cvt_f64_f32_e32 v[7:8], v8
23742374
; VI-NEXT: v_mov_b32_e32 v20, s3
2375-
; VI-NEXT: v_mov_b32_e32 v14, s1
2375+
; VI-NEXT: v_mov_b32_e32 v13, s1
23762376
; VI-NEXT: v_mov_b32_e32 v19, s2
2377-
; VI-NEXT: v_mov_b32_e32 v13, s0
2378-
; VI-NEXT: flat_store_dwordx4 v[15:16], v[9:12]
2379-
; VI-NEXT: flat_store_dwordx4 v[19:20], v[0:3]
2380-
; VI-NEXT: flat_store_dwordx4 v[13:14], v[5:8]
2377+
; VI-NEXT: v_mov_b32_e32 v12, s0
2378+
; VI-NEXT: flat_store_dwordx4 v[15:16], v[8:11]
2379+
; VI-NEXT: flat_store_dwordx4 v[19:20], v[4:7]
2380+
; VI-NEXT: flat_store_dwordx4 v[12:13], v[0:3]
23812381
; VI-NEXT: s_endpgm
23822382
;
23832383
; GFX11-TRUE16-LABEL: global_extload_v16f16_to_v16f64:
@@ -2389,40 +2389,40 @@ define amdgpu_kernel void @global_extload_v16f16_to_v16f64(ptr addrspace(1) %out
23892389
; GFX11-TRUE16-NEXT: global_load_b128 v[0:3], v32, s[2:3]
23902390
; GFX11-TRUE16-NEXT: global_load_b128 v[4:7], v32, s[2:3] offset:16
23912391
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(1)
2392-
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v10, v1.l
2393-
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0)
2394-
; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v23, 16, v5
23952392
; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v11, 16, v1
2396-
; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v19, 16, v4
2397-
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v15, v7.l
2393+
; GFX11-TRUE16-NEXT: s_waitcnt vmcnt(0)
2394+
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v23, v7.l
23982395
; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v7, 16, v7
2399-
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v14, v6.l
2396+
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v22, v6.l
24002397
; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v6, 16, v6
2398+
; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v19, 16, v5
2399+
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v10, v1.l
2400+
; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v15, 16, v4
24012401
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v13, v3.l
24022402
; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v3, 16, v3
24032403
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v12, v2.l
24042404
; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v2, 16, v2
2405-
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v18, v4.l
2406-
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v22, v5.l
2407-
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[4:5], v10
2408-
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v10, v23.l
2409-
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v34, v11.l
2410-
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v11, v19.l
2411-
; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v9, 16, v0
24122405
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v7, v7.l
24132406
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v6, v6.l
2407+
; GFX11-TRUE16-NEXT: v_lshrrev_b32_e32 v9, 16, v0
2408+
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v18, v5.l
2409+
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v34, v11.l
2410+
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v11, v19.l
2411+
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v14, v4.l
2412+
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[4:5], v10
2413+
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v10, v15.l
24142414
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v8, v0.l
24152415
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v3, v3.l
24162416
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v2, v2.l
2417-
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[28:29], v22
2418-
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[30:31], v10
2419-
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[24:25], v18
2420-
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[26:27], v11
2417+
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[28:29], v23
2418+
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[30:31], v7
2419+
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[24:25], v22
2420+
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[26:27], v6
24212421
; GFX11-TRUE16-NEXT: v_cvt_f32_f16_e32 v33, v9.l
2422-
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[20:21], v15
2423-
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[22:23], v7
2422+
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[20:21], v18
2423+
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[22:23], v11
24242424
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[16:17], v14
2425-
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[18:19], v6
2425+
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[18:19], v10
24262426
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[0:1], v8
24272427
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[8:9], v12
24282428
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[12:13], v13
@@ -2431,10 +2431,10 @@ define amdgpu_kernel void @global_extload_v16f16_to_v16f64(ptr addrspace(1) %out
24312431
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[6:7], v34
24322432
; GFX11-TRUE16-NEXT: v_cvt_f64_f32_e32 v[2:3], v33
24332433
; GFX11-TRUE16-NEXT: s_clause 0x7
2434-
; GFX11-TRUE16-NEXT: global_store_b128 v32, v[28:31], s[0:1] offset:80
2435-
; GFX11-TRUE16-NEXT: global_store_b128 v32, v[24:27], s[0:1] offset:64
2436-
; GFX11-TRUE16-NEXT: global_store_b128 v32, v[20:23], s[0:1] offset:112
2437-
; GFX11-TRUE16-NEXT: global_store_b128 v32, v[16:19], s[0:1] offset:96
2434+
; GFX11-TRUE16-NEXT: global_store_b128 v32, v[28:31], s[0:1] offset:112
2435+
; GFX11-TRUE16-NEXT: global_store_b128 v32, v[24:27], s[0:1] offset:96
2436+
; GFX11-TRUE16-NEXT: global_store_b128 v32, v[20:23], s[0:1] offset:80
2437+
; GFX11-TRUE16-NEXT: global_store_b128 v32, v[16:19], s[0:1] offset:64
24382438
; GFX11-TRUE16-NEXT: global_store_b128 v32, v[12:15], s[0:1] offset:48
24392439
; GFX11-TRUE16-NEXT: global_store_b128 v32, v[8:11], s[0:1] offset:32
24402440
; GFX11-TRUE16-NEXT: global_store_b128 v32, v[4:7], s[0:1] offset:16
@@ -2450,40 +2450,40 @@ define amdgpu_kernel void @global_extload_v16f16_to_v16f64(ptr addrspace(1) %out
24502450
; GFX11-FAKE16-NEXT: global_load_b128 v[0:3], v32, s[2:3]
24512451
; GFX11-FAKE16-NEXT: global_load_b128 v[4:7], v32, s[2:3] offset:16
24522452
; GFX11-FAKE16-NEXT: s_waitcnt vmcnt(1)
2453-
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v10, v1
2454-
; GFX11-FAKE16-NEXT: s_waitcnt vmcnt(0)
2455-
; GFX11-FAKE16-NEXT: v_lshrrev_b32_e32 v23, 16, v5
24562453
; GFX11-FAKE16-NEXT: v_lshrrev_b32_e32 v11, 16, v1
2457-
; GFX11-FAKE16-NEXT: v_lshrrev_b32_e32 v19, 16, v4
2458-
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v15, v7
2454+
; GFX11-FAKE16-NEXT: s_waitcnt vmcnt(0)
2455+
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v23, v7
24592456
; GFX11-FAKE16-NEXT: v_lshrrev_b32_e32 v7, 16, v7
2460-
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v14, v6
2457+
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v22, v6
24612458
; GFX11-FAKE16-NEXT: v_lshrrev_b32_e32 v6, 16, v6
2459+
; GFX11-FAKE16-NEXT: v_lshrrev_b32_e32 v19, 16, v5
2460+
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v10, v1
2461+
; GFX11-FAKE16-NEXT: v_lshrrev_b32_e32 v15, 16, v4
24622462
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v13, v3
24632463
; GFX11-FAKE16-NEXT: v_lshrrev_b32_e32 v3, 16, v3
24642464
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v12, v2
24652465
; GFX11-FAKE16-NEXT: v_lshrrev_b32_e32 v2, 16, v2
2466-
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v18, v4
2467-
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v22, v5
2468-
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[4:5], v10
2469-
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v10, v23
2470-
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v34, v11
2471-
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v11, v19
2472-
; GFX11-FAKE16-NEXT: v_lshrrev_b32_e32 v9, 16, v0
24732466
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v7, v7
24742467
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v6, v6
2468+
; GFX11-FAKE16-NEXT: v_lshrrev_b32_e32 v9, 16, v0
2469+
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v18, v5
2470+
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v34, v11
2471+
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v11, v19
2472+
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v14, v4
2473+
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[4:5], v10
2474+
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v10, v15
24752475
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v8, v0
24762476
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v3, v3
24772477
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v2, v2
2478-
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[28:29], v22
2479-
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[30:31], v10
2480-
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[24:25], v18
2481-
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[26:27], v11
2478+
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[28:29], v23
2479+
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[30:31], v7
2480+
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[24:25], v22
2481+
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[26:27], v6
24822482
; GFX11-FAKE16-NEXT: v_cvt_f32_f16_e32 v33, v9
2483-
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[20:21], v15
2484-
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[22:23], v7
2483+
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[20:21], v18
2484+
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[22:23], v11
24852485
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[16:17], v14
2486-
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[18:19], v6
2486+
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[18:19], v10
24872487
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[0:1], v8
24882488
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[8:9], v12
24892489
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[12:13], v13
@@ -2492,10 +2492,10 @@ define amdgpu_kernel void @global_extload_v16f16_to_v16f64(ptr addrspace(1) %out
24922492
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[6:7], v34
24932493
; GFX11-FAKE16-NEXT: v_cvt_f64_f32_e32 v[2:3], v33
24942494
; GFX11-FAKE16-NEXT: s_clause 0x7
2495-
; GFX11-FAKE16-NEXT: global_store_b128 v32, v[28:31], s[0:1] offset:80
2496-
; GFX11-FAKE16-NEXT: global_store_b128 v32, v[24:27], s[0:1] offset:64
2497-
; GFX11-FAKE16-NEXT: global_store_b128 v32, v[20:23], s[0:1] offset:112
2498-
; GFX11-FAKE16-NEXT: global_store_b128 v32, v[16:19], s[0:1] offset:96
2495+
; GFX11-FAKE16-NEXT: global_store_b128 v32, v[28:31], s[0:1] offset:112
2496+
; GFX11-FAKE16-NEXT: global_store_b128 v32, v[24:27], s[0:1] offset:96
2497+
; GFX11-FAKE16-NEXT: global_store_b128 v32, v[20:23], s[0:1] offset:80
2498+
; GFX11-FAKE16-NEXT: global_store_b128 v32, v[16:19], s[0:1] offset:64
24992499
; GFX11-FAKE16-NEXT: global_store_b128 v32, v[12:15], s[0:1] offset:48
25002500
; GFX11-FAKE16-NEXT: global_store_b128 v32, v[8:11], s[0:1] offset:32
25012501
; GFX11-FAKE16-NEXT: global_store_b128 v32, v[4:7], s[0:1] offset:16

0 commit comments

Comments
 (0)