|
3 | 3 | ; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx810 -verify-machineinstrs | FileCheck -check-prefixes=PREGFX10-PACKED %s |
4 | 4 | ; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx900 -verify-machineinstrs | FileCheck -check-prefixes=PREGFX10-PACKED %s |
5 | 5 | ; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1010 -verify-machineinstrs | FileCheck -check-prefixes=GFX10-PACKED %s |
6 | | -; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1100 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX11-PACKED %s |
7 | | -; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1200 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-SDAG %s |
8 | | -; RUN: llc < %s -global-isel -mtriple=amdgcn -mcpu=gfx1200 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-GISEL %s |
| 6 | +; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1100 -mattr=+real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX11-PACKED,GFX11-PACKED-TRUE16 %s |
| 7 | +; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1100 -mattr=-real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX11-PACKED,GFX11-PACKED-FAKE16 %s |
| 8 | +; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1200 -mattr=+real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-SDAG,GFX12-PACKED-SDAG-TRUE16 %s |
| 9 | +; RUN: llc < %s -mtriple=amdgcn -mcpu=gfx1200 -mattr=-real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-SDAG,GFX12-PACKED-SDAG-FAKE16 %s |
| 10 | +; RUN: llc < %s -global-isel -mtriple=amdgcn -mcpu=gfx1200 -mattr=+real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-GISEL,GFX12-PACKED-GISEL-TRUE16 %s |
| 11 | +; RUN: llc < %s -global-isel -mtriple=amdgcn -mcpu=gfx1200 -mattr=-real-true16 -amdgpu-enable-vopd=0 -verify-machineinstrs | FileCheck -check-prefixes=GFX12-PACKED,GFX12-PACKED-GISEL,GFX12-PACKED-GISEL-FAKE16 %s |
9 | 12 |
|
10 | 13 | define amdgpu_kernel void @tbuffer_store_d16_x(<4 x i32> %rsrc, half %data) { |
11 | 14 | ; PREGFX10-UNPACKED-LABEL: tbuffer_store_d16_x: |
@@ -36,25 +39,55 @@ define amdgpu_kernel void @tbuffer_store_d16_x(<4 x i32> %rsrc, half %data) { |
36 | 39 | ; GFX10-PACKED-NEXT: tbuffer_store_format_d16_x v0, off, s[0:3], 0 format:[BUF_FMT_10_11_11_SSCALED] |
37 | 40 | ; GFX10-PACKED-NEXT: s_endpgm |
38 | 41 | ; |
39 | | -; GFX11-PACKED-LABEL: tbuffer_store_d16_x: |
40 | | -; GFX11-PACKED: ; %bb.0: ; %main_body |
41 | | -; GFX11-PACKED-NEXT: s_clause 0x1 |
42 | | -; GFX11-PACKED-NEXT: s_load_b32 s6, s[4:5], 0x34 |
43 | | -; GFX11-PACKED-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
44 | | -; GFX11-PACKED-NEXT: s_waitcnt lgkmcnt(0) |
45 | | -; GFX11-PACKED-NEXT: v_mov_b32_e32 v0, s6 |
46 | | -; GFX11-PACKED-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], 0 format:[BUF_FMT_10_10_10_2_SNORM] |
47 | | -; GFX11-PACKED-NEXT: s_endpgm |
| 42 | +; GFX11-PACKED-TRUE16-LABEL: tbuffer_store_d16_x: |
| 43 | +; GFX11-PACKED-TRUE16: ; %bb.0: ; %main_body |
| 44 | +; GFX11-PACKED-TRUE16-NEXT: s_clause 0x1 |
| 45 | +; GFX11-PACKED-TRUE16-NEXT: s_load_b32 s6, s[4:5], 0x34 |
| 46 | +; GFX11-PACKED-TRUE16-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
| 47 | +; GFX11-PACKED-TRUE16-NEXT: s_waitcnt lgkmcnt(0) |
| 48 | +; GFX11-PACKED-TRUE16-NEXT: v_mov_b16_e32 v0.l, s6 |
| 49 | +; GFX11-PACKED-TRUE16-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], 0 format:[BUF_FMT_10_10_10_2_SNORM] |
| 50 | +; GFX11-PACKED-TRUE16-NEXT: s_endpgm |
48 | 51 | ; |
49 | | -; GFX12-PACKED-LABEL: tbuffer_store_d16_x: |
50 | | -; GFX12-PACKED: ; %bb.0: ; %main_body |
51 | | -; GFX12-PACKED-NEXT: s_clause 0x1 |
52 | | -; GFX12-PACKED-NEXT: s_load_b32 s6, s[4:5], 0x34 |
53 | | -; GFX12-PACKED-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
54 | | -; GFX12-PACKED-NEXT: s_wait_kmcnt 0x0 |
55 | | -; GFX12-PACKED-NEXT: v_mov_b32_e32 v0, s6 |
56 | | -; GFX12-PACKED-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], null format:[BUF_FMT_10_10_10_2_SNORM] |
57 | | -; GFX12-PACKED-NEXT: s_endpgm |
| 52 | +; GFX11-PACKED-FAKE16-LABEL: tbuffer_store_d16_x: |
| 53 | +; GFX11-PACKED-FAKE16: ; %bb.0: ; %main_body |
| 54 | +; GFX11-PACKED-FAKE16-NEXT: s_clause 0x1 |
| 55 | +; GFX11-PACKED-FAKE16-NEXT: s_load_b32 s6, s[4:5], 0x34 |
| 56 | +; GFX11-PACKED-FAKE16-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
| 57 | +; GFX11-PACKED-FAKE16-NEXT: s_waitcnt lgkmcnt(0) |
| 58 | +; GFX11-PACKED-FAKE16-NEXT: v_mov_b32_e32 v0, s6 |
| 59 | +; GFX11-PACKED-FAKE16-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], 0 format:[BUF_FMT_10_10_10_2_SNORM] |
| 60 | +; GFX11-PACKED-FAKE16-NEXT: s_endpgm |
| 61 | +; |
| 62 | +; GFX12-PACKED-SDAG-TRUE16-LABEL: tbuffer_store_d16_x: |
| 63 | +; GFX12-PACKED-SDAG-TRUE16: ; %bb.0: ; %main_body |
| 64 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: s_clause 0x1 |
| 65 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: s_load_b32 s6, s[4:5], 0x34 |
| 66 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
| 67 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: s_wait_kmcnt 0x0 |
| 68 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: v_mov_b16_e32 v0.l, s6 |
| 69 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], null format:[BUF_FMT_10_10_10_2_SNORM] |
| 70 | +; GFX12-PACKED-SDAG-TRUE16-NEXT: s_endpgm |
| 71 | +; |
| 72 | +; GFX12-PACKED-SDAG-FAKE16-LABEL: tbuffer_store_d16_x: |
| 73 | +; GFX12-PACKED-SDAG-FAKE16: ; %bb.0: ; %main_body |
| 74 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: s_clause 0x1 |
| 75 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: s_load_b32 s6, s[4:5], 0x34 |
| 76 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
| 77 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: s_wait_kmcnt 0x0 |
| 78 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: v_mov_b32_e32 v0, s6 |
| 79 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], null format:[BUF_FMT_10_10_10_2_SNORM] |
| 80 | +; GFX12-PACKED-SDAG-FAKE16-NEXT: s_endpgm |
| 81 | +; |
| 82 | +; GFX12-PACKED-GISEL-LABEL: tbuffer_store_d16_x: |
| 83 | +; GFX12-PACKED-GISEL: ; %bb.0: ; %main_body |
| 84 | +; GFX12-PACKED-GISEL-NEXT: s_clause 0x1 |
| 85 | +; GFX12-PACKED-GISEL-NEXT: s_load_b32 s6, s[4:5], 0x34 |
| 86 | +; GFX12-PACKED-GISEL-NEXT: s_load_b128 s[0:3], s[4:5], 0x24 |
| 87 | +; GFX12-PACKED-GISEL-NEXT: s_wait_kmcnt 0x0 |
| 88 | +; GFX12-PACKED-GISEL-NEXT: v_mov_b32_e32 v0, s6 |
| 89 | +; GFX12-PACKED-GISEL-NEXT: tbuffer_store_d16_format_x v0, off, s[0:3], null format:[BUF_FMT_10_10_10_2_SNORM] |
| 90 | +; GFX12-PACKED-GISEL-NEXT: s_endpgm |
58 | 91 | main_body: |
59 | 92 | call void @llvm.amdgcn.raw.tbuffer.store.f16(half %data, <4 x i32> %rsrc, i32 0, i32 0, i32 33, i32 0) |
60 | 93 | ret void |
@@ -264,3 +297,6 @@ declare void @llvm.amdgcn.raw.tbuffer.store.f16(half, <4 x i32>, i32, i32, i32, |
264 | 297 | declare void @llvm.amdgcn.raw.tbuffer.store.v2f16(<2 x half>, <4 x i32>, i32, i32, i32, i32) |
265 | 298 | declare void @llvm.amdgcn.raw.tbuffer.store.v3f16(<3 x half>, <4 x i32>, i32, i32, i32, i32) |
266 | 299 | declare void @llvm.amdgcn.raw.tbuffer.store.v4f16(<4 x half>, <4 x i32>, i32, i32, i32, i32) |
| 300 | +;; NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line: |
| 301 | +; GFX12-PACKED-GISEL-FAKE16: {{.*}} |
| 302 | +; GFX12-PACKED-GISEL-TRUE16: {{.*}} |
0 commit comments