Skip to content

Commit 5130b1a

Browse files
committed
Update tests
Signed-off-by: John Lu <[email protected]>
1 parent 9dc8247 commit 5130b1a

File tree

2 files changed

+31
-32
lines changed

2 files changed

+31
-32
lines changed

llvm/test/CodeGen/AMDGPU/ashr.v2i16.ll

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -685,16 +685,16 @@ define amdgpu_kernel void @ashr_v_imm_v4i16(ptr addrspace(1) %out, ptr addrspace
685685
; CI-NEXT: buffer_load_dwordx2 v[2:3], v[0:1], s[4:7], 0 addr64
686686
; CI-NEXT: s_mov_b64 s[2:3], s[6:7]
687687
; CI-NEXT: s_waitcnt vmcnt(0)
688-
; CI-NEXT: v_bfe_i32 v6, v3, 0, 16
689-
; CI-NEXT: v_ashr_i64 v[3:4], v[2:3], 56
690-
; CI-NEXT: v_bfe_i32 v5, v2, 0, 16
688+
; CI-NEXT: v_bfe_i32 v4, v2, 0, 16
689+
; CI-NEXT: v_bfe_i32 v5, v3, 0, 16
690+
; CI-NEXT: v_ashrrev_i32_e32 v3, 24, v3
691691
; CI-NEXT: v_ashrrev_i32_e32 v2, 24, v2
692-
; CI-NEXT: v_bfe_u32 v4, v6, 8, 16
693-
; CI-NEXT: v_lshlrev_b32_e32 v2, 16, v2
694-
; CI-NEXT: v_bfe_u32 v5, v5, 8, 16
695692
; CI-NEXT: v_lshlrev_b32_e32 v3, 16, v3
696-
; CI-NEXT: v_or_b32_e32 v3, v4, v3
697-
; CI-NEXT: v_or_b32_e32 v2, v5, v2
693+
; CI-NEXT: v_bfe_u32 v5, v5, 8, 16
694+
; CI-NEXT: v_lshlrev_b32_e32 v2, 16, v2
695+
; CI-NEXT: v_bfe_u32 v4, v4, 8, 16
696+
; CI-NEXT: v_or_b32_e32 v3, v5, v3
697+
; CI-NEXT: v_or_b32_e32 v2, v4, v2
698698
; CI-NEXT: buffer_store_dwordx2 v[2:3], v[0:1], s[0:3], 0 addr64
699699
; CI-NEXT: s_endpgm
700700
;

llvm/test/CodeGen/AMDGPU/load-constant-i8.ll

Lines changed: 23 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -7475,12 +7475,17 @@ define amdgpu_kernel void @constant_sextload_v16i8_to_v16i64(ptr addrspace(1) %o
74757475
; GFX12-NEXT: s_clause 0x1
74767476
; GFX12-NEXT: global_store_b128 v24, v[0:3], s[0:1] offset:112
74777477
; GFX12-NEXT: global_store_b128 v24, v[8:11], s[0:1] offset:96
7478-
; GFX12-NEXT: v_dual_mov_b32 v0, s22 :: v_dual_mov_b32 v3, s21
7479-
; GFX12-NEXT: v_dual_mov_b32 v1, s23 :: v_dual_mov_b32 v2, s20
7480-
; GFX12-NEXT: v_dual_mov_b32 v9, s25 :: v_dual_mov_b32 v8, s24
7481-
; GFX12-NEXT: v_dual_mov_b32 v11, s27 :: v_dual_mov_b32 v10, s26
7482-
; GFX12-NEXT: v_dual_mov_b32 v21, s31 :: v_dual_mov_b32 v20, s30
7483-
; GFX12-NEXT: v_dual_mov_b32 v23, s29 :: v_dual_mov_b32 v22, s28
7478+
; GFX12-NEXT: v_dual_mov_b32 v0, s20 :: v_dual_mov_b32 v3, s29
7479+
; GFX12-NEXT: v_dual_mov_b32 v1, s21 :: v_dual_mov_b32 v2, s31
7480+
; GFX12-NEXT: v_mov_b32_e32 v9, s25
7481+
; GFX12-NEXT: s_bfe_i64 s[2:3], s[4:5], 0x80000
7482+
; GFX12-NEXT: s_bfe_i64 s[4:5], s[30:31], 0x80000
7483+
; GFX12-NEXT: v_dual_mov_b32 v8, s24 :: v_dual_mov_b32 v11, s23
7484+
; GFX12-NEXT: v_dual_mov_b32 v10, s22 :: v_dual_mov_b32 v17, s27
7485+
; GFX12-NEXT: v_dual_mov_b32 v16, s26 :: v_dual_mov_b32 v19, s7
7486+
; GFX12-NEXT: v_dual_mov_b32 v18, s6 :: v_dual_mov_b32 v21, s3
7487+
; GFX12-NEXT: v_dual_mov_b32 v20, s2 :: v_dual_mov_b32 v23, s5
7488+
; GFX12-NEXT: v_mov_b32_e32 v22, s4
74847489
; GFX12-NEXT: s_clause 0x5
74857490
; GFX12-NEXT: global_store_b128 v24, v[12:15], s[0:1] offset:80
74867491
; GFX12-NEXT: global_store_b128 v24, v[4:7], s[0:1] offset:64
@@ -9033,19 +9038,9 @@ define amdgpu_kernel void @constant_sextload_v32i8_to_v32i64(ptr addrspace(1) %o
90339038
; GFX12-NEXT: global_store_b128 v24, v[8:11], s[8:9] offset:208
90349039
; GFX12-NEXT: global_store_b128 v24, v[12:15], s[8:9] offset:192
90359040
; GFX12-NEXT: s_wait_alu 0xfffe
9036-
; GFX12-NEXT: v_dual_mov_b32 v0, s36 :: v_dual_mov_b32 v3, s71
9037-
; GFX12-NEXT: v_dual_mov_b32 v1, s37 :: v_dual_mov_b32 v2, s70
9038-
; GFX12-NEXT: v_mov_b32_e32 v5, s53
9039-
; GFX12-NEXT: s_lshr_b32 s34, s3, 8
9040-
; GFX12-NEXT: s_mov_b32 s30, s3
9041-
; GFX12-NEXT: s_lshr_b32 s24, s2, 16
9042-
; GFX12-NEXT: s_lshr_b32 s22, s2, 24
9043-
; GFX12-NEXT: s_bfe_i64 s[28:29], s[4:5], 0x80000
9044-
; GFX12-NEXT: s_bfe_i64 s[58:59], s[58:59], 0x80000
9045-
; GFX12-NEXT: v_dual_mov_b32 v4, s52 :: v_dual_mov_b32 v7, s51
9046-
; GFX12-NEXT: v_dual_mov_b32 v6, s50 :: v_dual_mov_b32 v9, s55
9047-
; GFX12-NEXT: s_lshr_b32 s20, s2, 8
9048-
; GFX12-NEXT: s_ashr_i64 s[26:27], s[2:3], 56
9041+
; GFX12-NEXT: v_dual_mov_b32 v0, s4 :: v_dual_mov_b32 v3, s62
9042+
; GFX12-NEXT: v_dual_mov_b32 v1, s5 :: v_dual_mov_b32 v2, s63
9043+
; GFX12-NEXT: v_mov_b32_e32 v5, s55
90499044
; GFX12-NEXT: s_bfe_i64 s[60:61], s[60:61], 0x80000
90509045
; GFX12-NEXT: v_dual_mov_b32 v4, s54 :: v_dual_mov_b32 v7, s53
90519046
; GFX12-NEXT: v_dual_mov_b32 v6, s52 :: v_dual_mov_b32 v9, s57
@@ -9077,11 +9072,15 @@ define amdgpu_kernel void @constant_sextload_v32i8_to_v32i64(ptr addrspace(1) %o
90779072
; GFX12-NEXT: global_store_b128 v24, v[12:15], s[8:9] offset:128
90789073
; GFX12-NEXT: global_store_b128 v24, v[16:19], s[8:9] offset:112
90799074
; GFX12-NEXT: global_store_b128 v24, v[20:23], s[8:9] offset:96
9080-
; GFX12-NEXT: v_dual_mov_b32 v0, s24 :: v_dual_mov_b32 v3, s23
9081-
; GFX12-NEXT: v_dual_mov_b32 v1, s25 :: v_dual_mov_b32 v2, s22
9082-
; GFX12-NEXT: v_mov_b32_e32 v5, s17
9083-
; GFX12-NEXT: s_lshr_b32 s68, s0, 8
9084-
; GFX12-NEXT: s_bfe_i64 s[6:7], s[62:63], 0x80000
9075+
; GFX12-NEXT: v_dual_mov_b32 v0, s28 :: v_dual_mov_b32 v3, s27
9076+
; GFX12-NEXT: v_dual_mov_b32 v1, s29 :: v_dual_mov_b32 v2, s26
9077+
; GFX12-NEXT: v_mov_b32_e32 v5, s21
9078+
; GFX12-NEXT: s_lshr_b32 s64, s0, 8
9079+
; GFX12-NEXT: s_bfe_i64 s[18:19], s[18:19], 0x80000
9080+
; GFX12-NEXT: s_bfe_i64 s[16:17], s[16:17], 0x80000
9081+
; GFX12-NEXT: v_dual_mov_b32 v4, s20 :: v_dual_mov_b32 v7, s25
9082+
; GFX12-NEXT: v_dual_mov_b32 v6, s24 :: v_dual_mov_b32 v9, s23
9083+
; GFX12-NEXT: s_bfe_i64 s[12:13], s[12:13], 0x80000
90859084
; GFX12-NEXT: s_bfe_i64 s[14:15], s[14:15], 0x80000
90869085
; GFX12-NEXT: s_wait_alu 0xfffe
90879086
; GFX12-NEXT: v_dual_mov_b32 v8, s22 :: v_dual_mov_b32 v11, s6

0 commit comments

Comments
 (0)