|
3 | 3 | ; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx810 -verify-machineinstrs | FileCheck -check-prefixes=PREGFX10-PACKED %s
|
4 | 4 | ; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx900 -verify-machineinstrs | FileCheck -check-prefixes=PREGFX10-PACKED %s
|
5 | 5 | ; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1010 -verify-machineinstrs | FileCheck -check-prefixes=GFX10-PACKED %s
|
6 |
| -; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1100 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX11-PACKED %s |
7 |
| -; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1200 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-SDAG %s |
8 |
| -; RUN: llc < %s -global-isel -mtriple=amdgcn -mcpu=gfx1200 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-GISEL %s |
| 6 | +; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1100 -mattr=+real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX11-PACKED,GFX11-PACKED-TRUE16 %s |
| 7 | +; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1100 -mattr=-real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX11-PACKED,GFX11-PACKED-FAKE16 %s |
| 8 | +; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1200 -mattr=+real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-SDAG,GFX12-PACKED-SDAG-TRUE16 %s |
| 9 | +; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1200 -mattr=-real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-SDAG,GFX12-PACKED-SDAG-FAKE16 %s |
| 10 | +; RUN: llc < %s -global-isel -mtriple=amdgcn -mcpu=gfx1200 -mattr=+real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-GISEL,GFX12-PACKED-GISEL-TRUE16 %s |
| 11 | +; RUN: llc < %s -global-isel -mtriple=amdgcn -mcpu=gfx1200 -mattr=-real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-GISEL,GFX12-PACKED-GISEL-FAKE16 %s |
9 | 12 |
|
10 | 13 | define amdgpu_kernel void @tbuffer_store_d16_x(<4 x i32> %rsrc, half %data) {
|
11 | 14 | ; PREGFX10-UNPACKED-LABEL: tbuffer_store_d16_x:
|
@@ -36,25 +39,55 @@ define amdgpu_kernel void @tbuffer_store_d16_x(<4 x i32> %rsrc, half %data) {
|
36 | 39 | ; GFX10-PACKED-NEXT: tbuffer_store_format_d16_x v0, off, s[0:3], 0 format:[BUF_FMT_10_11_11_SSCALED]
|
37 | 40 | ; GFX10-PACKED-NEXT: s_endpgm
|
38 | 41 | ;
|
39 |
| -; GFX11-PACKED-LABEL: tbuffer_store_d16_x: |
40 |
| -; GFX11-PACKED: ; %bb.0: ; %main_body |
41 |
| -; GFX11-PACKED-NEXT: s_clause 0x1 |
42 |
| -; GFX11-PACKED-NEXT: s_load_b32 s6, s[4:5], 0x34 |
43 |
| -; GFX11-PACKED-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
44 |
| -; GFX11-PACKED-NEXT: s_waitcnt lgkmcnt(0) |
45 |
| -; GFX11-PACKED-NEXT: v_mov_b32_e32 v0, s6 |
46 |
| -; GFX11-PACKED-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], 0 format:[BUF_FMT_10_10_10_2_SNORM] |
47 |
| -; GFX11-PACKED-NEXT: s_endpgm |
| 42 | +; GFX11-PACKED-TRUE16-LABEL: tbuffer_store_d16_x: |
| 43 | +; GFX11-PACKED-TRUE16: ; %bb.0: ; %main_body |
| 44 | +; GFX11-PACKED-TRUE16-NEXT: s_clause 0x1 |
| 45 | +; GFX11-PACKED-TRUE16-NEXT: s_load_b32 s6, s[4:5], 0x34 |
| 46 | +; GFX11-PACKED-TRUE16-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
| 47 | +; GFX11-PACKED-TRUE16-NEXT: s_waitcnt lgkmcnt(0) |
| 48 | +; GFX11-PACKED-TRUE16-NEXT: v_mov_b16_e32 v0.l, s6 |
| 49 | +; GFX11-PACKED-TRUE16-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], 0 format:[BUF_FMT_10_10_10_2_SNORM] |
| 50 | +; GFX11-PACKED-TRUE16-NEXT: s_endpgm |
48 | 51 | ;
|
49 |
| -; GFX12-PACKED-LABEL: tbuffer_store_d16_x: |
50 |
| -; GFX12-PACKED: ; %bb.0: ; %main_body |
51 |
| -; GFX12-PACKED-NEXT: s_clause 0x1 |
52 |
| -; GFX12-PACKED-NEXT: s_load_b32 s6, s[4:5], 0x34 |
53 |
| -; GFX12-PACKED-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
54 |
| -; GFX12-PACKED-NEXT: s_wait_kmcnt 0x0 |
55 |
| -; GFX12-PACKED-NEXT: v_mov_b32_e32 v0, s6 |
56 |
| -; GFX12-PACKED-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], null format:[BUF_FMT_10_10_10_2_SNORM] |
57 |
| -; GFX12-PACKED-NEXT: s_endpgm |
| 52 | +; GFX11-PACKED-FAKE16-LABEL: tbuffer_store_d16_x: |
| 53 | +; GFX11-PACKED-FAKE16: ; %bb.0: ; %main_body |
| 54 | +; GFX11-PACKED-FAKE16-NEXT: s_clause 0x1 |
| 55 | +; GFX11-PACKED-FAKE16-NEXT: s_load_b32 s6, s[4:5], 0x34 |
| 56 | +; GFX11-PACKED-FAKE16-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
| 57 | +; GFX11-PACKED-FAKE16-NEXT: s_waitcnt lgkmcnt(0) |
| 58 | +; GFX11-PACKED-FAKE16-NEXT: v_mov_b32_e32 v0, s6 |
| 59 | +; GFX11-PACKED-FAKE16-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], 0 format:[BUF_FMT_10_10_10_2_SNORM] |
| 60 | +; GFX11-PACKED-FAKE16-NEXT: s_endpgm |
| 61 | +; |
| 62 | +; GFX12-PACKED-SDAG-TRUE16-LABEL: tbuffer_store_d16_x: |
| 63 | +; GFX12-PACKED-SDAG-TRUE16: ; %bb.0: ; %main_body |
| 64 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: s_clause 0x1 |
| 65 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: s_load_b32 s6, s[4:5], 0x34 |
| 66 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
| 67 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: s_wait_kmcnt 0x0 |
| 68 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: v_mov_b16_e32 v0.l, s6 |
| 69 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], null format:[BUF_FMT_10_10_10_2_SNORM] |
| 70 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: s_endpgm |
| 71 | +; |
| 72 | +; GFX12-PACKED-SDAG-FAKE16-LABEL: tbuffer_store_d16_x: |
| 73 | +; GFX12-PACKED-SDAG-FAKE16: ; %bb.0: ; %main_body |
| 74 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: s_clause 0x1 |
| 75 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: s_load_b32 s6, s[4:5], 0x34 |
| 76 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
| 77 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: s_wait_kmcnt 0x0 |
| 78 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: v_mov_b32_e32 v0, s6 |
| 79 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], null format:[BUF_FMT_10_10_10_2_SNORM] |
| 80 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: s_endpgm |
| 81 | +; |
| 82 | +; GFX12-PACKED-GISEL-LABEL: tbuffer_store_d16_x: |
| 83 | +; GFX12-PACKED-GISEL: ; %bb.0: ; %main_body |
| 84 | +; GFX12-PACKED-GISEL-NEXT: s_clause 0x1 |
| 85 | +; GFX12-PACKED-GISEL-NEXT: s_load_b32 s6, s[4:5], 0x34 |
| 86 | +; GFX12-PACKED-GISEL-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
| 87 | +; GFX12-PACKED-GISEL-NEXT: s_wait_kmcnt 0x0 |
| 88 | +; GFX12-PACKED-GISEL-NEXT: v_mov_b32_e32 v0, s6 |
| 89 | +; GFX12-PACKED-GISEL-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], null format:[BUF_FMT_10_10_10_2_SNORM] |
| 90 | +; GFX12-PACKED-GISEL-NEXT: s_endpgm |
58 | 91 | main_body:
|
59 | 92 | call void @llvm.amdgcn.raw.tbuffer.store.f16(half %data, <4 x i32> %rsrc, i32 0, i32 0, i32 33, i32 0)
|
60 | 93 | ret void
|
@@ -264,3 +297,6 @@ declare void @llvm.amdgcn.raw.tbuffer.store.f16(half, <4 x i32>, i32, i32, i32,
|
264 | 297 | declare void @llvm.amdgcn.raw.tbuffer.store.v2f16(<2 x half>, <4 x i32>, i32, i32, i32, i32)
|
265 | 298 | declare void @llvm.amdgcn.raw.tbuffer.store.v3f16(<3 x half>, <4 x i32>, i32, i32, i32, i32)
|
266 | 299 | declare void @llvm.amdgcn.raw.tbuffer.store.v4f16(<4 x half>, <4 x i32>, i32, i32, i32, i32)
|
| 300 | +;; NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line: |
| 301 | +; GFX12-PACKED-GISEL-FAKE16: {{.*}} |
| 302 | +; GFX12-PACKED-GISEL-TRUE16: {{.*}} |
0 commit comments