|
| 1 | +// NOTE: Assertions have been autogenerated by utils/update_cc_test_checks.py UTC_ARGS: --check-globals smart |
| 2 | +// REQUIRES: amdgpu-registered-target |
| 3 | +// RUN: %clang_cc1 -triple amdgcn-unknown-unknown -target-cpu gfx950 -emit-llvm -o - %s | FileCheck %s -check-prefixes=GFX,GFX950 |
| 4 | +// RUN: %clang_cc1 -triple amdgcn-unknown-unknown -target-cpu gfx9-4-generic -emit-llvm -o - %s | FileCheck %s -check-prefixes=GFX,GFX9_4_GENERIC |
| 5 | + |
| 6 | +typedef __attribute__((__vector_size__(4 * sizeof(unsigned int)))) unsigned int v4u32; // Vector of four unsigned ints; the CHECK lines below match it as <4 x i32>. |
| 7 | +typedef v4u32 __global *global_ptr_to_v4u32; // Pointer to a v4u32 qualified __global; the CHECK lines below match it as ptr addrspace(1). |
| 8 | + |
| 9 | +//------------------------------------------------------------------------------ |
| 10 | +// Store |
| 11 | +//------------------------------------------------------------------------------ |
| 12 | +// GFX-LABEL: @test_amdgcn_global_store_b128_00( |
| 13 | +// GFX-NEXT: entry: |
| 14 | +// GFX-NEXT: tail call void @llvm.amdgcn.global.store.b128(ptr addrspace(1) [[PTR:%.*]], <4 x i32> [[DATA:%.*]], metadata [[META4:![0-9]+]]) |
| 15 | +// GFX-NEXT: ret void |
| 16 | +// |
| 17 | +void test_amdgcn_global_store_b128_00(global_ptr_to_v4u32 ptr, v4u32 data) { // Store builtin called with the string argument "wavefront". |
| 18 | + __builtin_amdgcn_global_store_b128(ptr, data, "wavefront"); // CHECK lines expect the string as the call's metadata operand (META4 = !{!"wavefront"}). |
| 19 | +} |
| 20 | + |
| 21 | +// GFX-LABEL: @test_amdgcn_global_store_b128_01( |
| 22 | +// GFX-NEXT: entry: |
| 23 | +// GFX-NEXT: tail call void @llvm.amdgcn.global.store.b128(ptr addrspace(1) [[PTR:%.*]], <4 x i32> [[DATA:%.*]], metadata [[META5:![0-9]+]]) |
| 24 | +// GFX-NEXT: ret void |
| 25 | +// |
| 26 | +void test_amdgcn_global_store_b128_01(global_ptr_to_v4u32 ptr, v4u32 data) { // Store builtin called with the string argument "workgroup". |
| 27 | + __builtin_amdgcn_global_store_b128(ptr, data, "workgroup"); // CHECK lines expect the string as the call's metadata operand (META5 = !{!"workgroup"}). |
| 28 | +} |
| 29 | + |
| 30 | +// GFX-LABEL: @test_amdgcn_global_store_b128_10( |
| 31 | +// GFX-NEXT: entry: |
| 32 | +// GFX-NEXT: tail call void @llvm.amdgcn.global.store.b128(ptr addrspace(1) [[PTR:%.*]], <4 x i32> [[DATA:%.*]], metadata [[META6:![0-9]+]]) |
| 33 | +// GFX-NEXT: ret void |
| 34 | +// |
| 35 | +void test_amdgcn_global_store_b128_10(global_ptr_to_v4u32 ptr, v4u32 data) { // Store builtin called with the string argument "agent". |
| 36 | + __builtin_amdgcn_global_store_b128(ptr, data, "agent"); // CHECK lines expect the string as the call's metadata operand (META6 = !{!"agent"}). |
| 37 | +} |
| 38 | + |
| 39 | +// GFX-LABEL: @test_amdgcn_global_store_b128_11( |
| 40 | +// GFX-NEXT: entry: |
| 41 | +// GFX-NEXT: tail call void @llvm.amdgcn.global.store.b128(ptr addrspace(1) [[PTR:%.*]], <4 x i32> [[DATA:%.*]], metadata [[META7:![0-9]+]]) |
| 42 | +// GFX-NEXT: ret void |
| 43 | +// |
| 44 | +void test_amdgcn_global_store_b128_11(global_ptr_to_v4u32 ptr, v4u32 data) { // Store builtin called with an empty string argument. |
| 45 | + __builtin_amdgcn_global_store_b128(ptr, data, ""); // CHECK lines expect the empty string as the call's metadata operand (META7 = !{!""}). |
| 46 | +} |
| 47 | + |
| 48 | +//------------------------------------------------------------------------------ |
| 49 | +// Load |
| 50 | +//------------------------------------------------------------------------------ |
| 51 | +// GFX-LABEL: @test_amdgcn_global_load_b128_00( |
| 52 | +// GFX-NEXT: entry: |
| 53 | +// GFX-NEXT: [[TMP0:%.*]] = tail call <4 x i32> @llvm.amdgcn.global.load.b128(ptr addrspace(1) [[PTR:%.*]], metadata [[META4]]) |
| 54 | +// GFX-NEXT: ret <4 x i32> [[TMP0]] |
| 55 | +// |
| 56 | +v4u32 test_amdgcn_global_load_b128_00(global_ptr_to_v4u32 ptr) { // Load builtin called with the string argument "wavefront"; its result is returned directly. |
| 57 | + return __builtin_amdgcn_global_load_b128(ptr, "wavefront"); // CHECK lines expect the same metadata node as the matching store test (META4 = !{!"wavefront"}). |
| 58 | +} |
| 59 | + |
| 60 | +// GFX-LABEL: @test_amdgcn_global_load_b128_01( |
| 61 | +// GFX-NEXT: entry: |
| 62 | +// GFX-NEXT: [[TMP0:%.*]] = tail call <4 x i32> @llvm.amdgcn.global.load.b128(ptr addrspace(1) [[PTR:%.*]], metadata [[META5]]) |
| 63 | +// GFX-NEXT: ret <4 x i32> [[TMP0]] |
| 64 | +// |
| 65 | +v4u32 test_amdgcn_global_load_b128_01(global_ptr_to_v4u32 ptr) { // Load builtin called with the string argument "workgroup"; its result is returned directly. |
| 66 | + return __builtin_amdgcn_global_load_b128(ptr, "workgroup"); // CHECK lines expect the same metadata node as the matching store test (META5 = !{!"workgroup"}). |
| 67 | +} |
| 68 | + |
| 69 | +// GFX-LABEL: @test_amdgcn_global_load_b128_10( |
| 70 | +// GFX-NEXT: entry: |
| 71 | +// GFX-NEXT: [[TMP0:%.*]] = tail call <4 x i32> @llvm.amdgcn.global.load.b128(ptr addrspace(1) [[PTR:%.*]], metadata [[META6]]) |
| 72 | +// GFX-NEXT: ret <4 x i32> [[TMP0]] |
| 73 | +// |
| 74 | +v4u32 test_amdgcn_global_load_b128_10(global_ptr_to_v4u32 ptr) { // Load builtin called with the string argument "agent"; its result is returned directly. |
| 75 | + return __builtin_amdgcn_global_load_b128(ptr, "agent"); // CHECK lines expect the same metadata node as the matching store test (META6 = !{!"agent"}). |
| 76 | +} |
| 77 | + |
| 78 | +// GFX-LABEL: @test_amdgcn_global_load_b128_11( |
| 79 | +// GFX-NEXT: entry: |
| 80 | +// GFX-NEXT: [[TMP0:%.*]] = tail call <4 x i32> @llvm.amdgcn.global.load.b128(ptr addrspace(1) [[PTR:%.*]], metadata [[META7]]) |
| 81 | +// GFX-NEXT: ret <4 x i32> [[TMP0]] |
| 82 | +// |
| 83 | +v4u32 test_amdgcn_global_load_b128_11(global_ptr_to_v4u32 ptr) { // Load builtin called with an empty string argument; its result is returned directly. |
| 84 | + return __builtin_amdgcn_global_load_b128(ptr, ""); // CHECK lines expect the same metadata node as the matching store test (META7 = !{!""}). |
| 85 | +} |
| 86 | +//. |
| 87 | +// GFX950: [[META4]] = !{!"wavefront"} |
| 88 | +// GFX950: [[META5]] = !{!"workgroup"} |
| 89 | +// GFX950: [[META6]] = !{!"agent"} |
| 90 | +// GFX950: [[META7]] = !{!""} |
| 91 | +//. |
| 92 | +// GFX9_4_GENERIC: [[META4]] = !{!"wavefront"} |
| 93 | +// GFX9_4_GENERIC: [[META5]] = !{!"workgroup"} |
| 94 | +// GFX9_4_GENERIC: [[META6]] = !{!"agent"} |
| 95 | +// GFX9_4_GENERIC: [[META7]] = !{!""} |
| 96 | +//. |
| 97 | +//// NOTE: These prefixes are unused and the list is autogenerated. Do not add tests below this line: |
| 98 | +// GFX950: {{.*}} |
| 99 | +// GFX9_4_GENERIC: {{.*}} |
0 commit comments