|
| 1 | +// RUN: mlir-vulkan-runner %s --shared-libs=%vulkan-runtime-wrappers,%mlir_runner_utils --entry-point-result=void | FileCheck %s |
| 2 | + |
| 3 | +// CHECK: [3.3, 3.3, 3.3, 3.3, 0, 0, 0, 0] |
| 4 | +module attributes { |
| 5 | + gpu.container_module, |
| 6 | + spirv.target_env = #spirv.target_env< |
| 7 | + #spirv.vce<v1.0, [Shader], [SPV_KHR_storage_buffer_storage_class]>, #spirv.resource_limits<>> |
| 8 | +} { |
| 9 | + gpu.module @kernels { |
| 10 | + gpu.func @kernel_add(%arg0 : memref<8xf32>, %arg1 : memref<8xf32>, %arg2 : memref<8xf32>) |
| 11 | + kernel attributes { spirv.entry_point_abi = #spirv.entry_point_abi<workgroup_size = [1, 1, 1]>} { |
| 12 | + %0 = gpu.block_id x |
| 13 | + %limit = arith.constant 4 : index |
| 14 | + %cond = arith.cmpi slt, %0, %limit : index |
| 15 | + scf.if %cond { |
| 16 | + %1 = memref.load %arg0[%0] : memref<8xf32> |
| 17 | + %2 = memref.load %arg1[%0] : memref<8xf32> |
| 18 | + %3 = arith.addf %1, %2 : f32 |
| 19 | + memref.store %3, %arg2[%0] : memref<8xf32> |
| 20 | + } |
| 21 | + gpu.return |
| 22 | + } |
| 23 | + } |
| 24 | + |
| 25 | + func.func @main() { |
| 26 | + %arg0 = memref.alloc() : memref<8xf32> |
| 27 | + %arg1 = memref.alloc() : memref<8xf32> |
| 28 | + %arg2 = memref.alloc() : memref<8xf32> |
| 29 | + %0 = arith.constant 0 : i32 |
| 30 | + %1 = arith.constant 1 : i32 |
| 31 | + %2 = arith.constant 2 : i32 |
| 32 | + %value0 = arith.constant 0.0 : f32 |
| 33 | + %value1 = arith.constant 1.1 : f32 |
| 34 | + %value2 = arith.constant 2.2 : f32 |
| 35 | + %arg3 = memref.cast %arg0 : memref<8xf32> to memref<?xf32> |
| 36 | + %arg4 = memref.cast %arg1 : memref<8xf32> to memref<?xf32> |
| 37 | + %arg5 = memref.cast %arg2 : memref<8xf32> to memref<?xf32> |
| 38 | + call @fillResource1DFloat(%arg3, %value1) : (memref<?xf32>, f32) -> () |
| 39 | + call @fillResource1DFloat(%arg4, %value2) : (memref<?xf32>, f32) -> () |
| 40 | + call @fillResource1DFloat(%arg5, %value0) : (memref<?xf32>, f32) -> () |
| 41 | + |
| 42 | + %cst1 = arith.constant 1 : index |
| 43 | + %cst8 = arith.constant 8 : index |
| 44 | + gpu.launch_func @kernels::@kernel_add |
| 45 | + blocks in (%cst8, %cst1, %cst1) threads in (%cst1, %cst1, %cst1) |
| 46 | + args(%arg0 : memref<8xf32>, %arg1 : memref<8xf32>, %arg2 : memref<8xf32>) |
| 47 | + %arg6 = memref.cast %arg5 : memref<?xf32> to memref<*xf32> |
| 48 | + call @printMemrefF32(%arg6) : (memref<*xf32>) -> () |
| 49 | + return |
| 50 | + } |
| 51 | + func.func private @fillResource1DFloat(%0 : memref<?xf32>, %1 : f32) |
| 52 | + func.func private @printMemrefF32(%ptr : memref<*xf32>) |
| 53 | +} |
| 54 | + |
0 commit comments