@@ -162,14 +162,14 @@ gpu.func @create_nd_tdesc_non_memref(%arg0: ui64, %arg1: ui64,
162162}
163163
164164// -----
165- // CHECK-LABEL: gpu.func @test_update_nd_offset_1d (
165+ // CHECK-LABEL: gpu.func @update_nd_offset_1d (
166166// CHECK: %[[ARG0:[0-9a-zA-Z]+]]: memref<256xf32>) {
167167// CHECK: %[[CST:.*]] = arith.constant dense<1.000000e+00> : vector<1xf32>
168168// CHECK: %[[T0:.*]] = xegpu.create_nd_tdesc %[[ARG0]][%{{.*}}] : memref<256xf32> -> !xegpu.tensor_desc<16xf32>
169169// CHECK: %[[T1:.*]] = xegpu.update_nd_offset %[[T0]], [%c32] : !xegpu.tensor_desc<16xf32>
170170// CHECK: xegpu.store_nd %[[CST]], %[[T1]] : vector<1xf32>, !xegpu.tensor_desc<16xf32>
171171gpu.module @test {
172- gpu.func @test_update_nd_offset_1d (%arg0: memref <256 xf32 >){
172+ gpu.func @update_nd_offset_1d (%arg0: memref <256 xf32 >){
173173 %c0 = arith.constant 0 : index
174174 %c32 = arith.constant 32 : index
175175 %1 = arith.constant dense <1.000000e+00 > : vector <16 xf32 >
@@ -181,14 +181,14 @@ gpu.func @test_update_nd_offset_1d(%arg0: memref<256xf32>){
181181}
182182
183183// -----
184- // CHECK-LABEL: gpu.func @test_update_nd_offset_2d
184+ // CHECK-LABEL: gpu.func @update_nd_offset_2d
185185// CHECK: %[[ARG0:[0-9a-zA-Z]+]]: memref<256x256xf32>) {
186186// CHECK: %[[CST:.*]] = arith.constant dense<1.000000e+00> : vector<16xf32>
187187// CHECK: %[[T0:.*]] = xegpu.create_nd_tdesc %[[ARG0]][%{{.*}}] : memref<256x256xf32> -> !xegpu.tensor_desc<16x16xf32>
188188// CHECK: %[[T1:.*]] = xegpu.update_nd_offset %[[T0]], [%c32, %c32] : !xegpu.tensor_desc<16x16xf32>
189189// CHECK: xegpu.store_nd %[[CST]], %[[T1]] : vector<16xf32>, !xegpu.tensor_desc<16x16xf32>
190190gpu.module @test {
191- gpu.func @test_update_nd_offset_2d (%arg0: memref <256 x256 xf32 >){
191+ gpu.func @update_nd_offset_2d (%arg0: memref <256 x256 xf32 >){
192192 %c0 = arith.constant 0 : index
193193 %c32 = arith.constant 32 : index
194194 %1 = arith.constant dense <1.000000e+00 > : vector <16 x16 xf32 >
@@ -200,12 +200,12 @@ gpu.func @test_update_nd_offset_2d(%arg0: memref<256x256xf32>){
200200}
201201
202202// -----
203- // CHECK-LABEL: gpu.func @test_prefetch_2d
203+ // CHECK-LABEL: gpu.func @prefetch_2d
204204// CHECK: (%[[ARG0:[0-9a-zA-Z]+]]: memref<256x256xf16>) {
205205// CHECK: %[[T0:.*]] = xegpu.create_nd_tdesc %[[ARG0]][%{{.*}}] : memref<256x256xf16> -> !xegpu.tensor_desc<16x16xf16>
206206// CHECK: xegpu.prefetch_nd %[[T0]] <{l1_hint = #xegpu.cache_hint<cached>, l2_hint = #xegpu.cache_hint<uncached>}> : !xegpu.tensor_desc<16x16xf16>
207207gpu.module @test {
208- gpu.func @test_prefetch_2d (%arg0: memref <256 x256 xf16 >){
208+ gpu.func @prefetch_2d (%arg0: memref <256 x256 xf16 >){
209209 %c0 = arith.constant 0 : index
210210 %0 = xegpu.create_nd_tdesc %arg0 [%c0 , %c0 ] : memref <256 x256 xf16 > -> !xegpu.tensor_desc <16 x16 xf16 >
211211 xegpu.prefetch_nd %0 <{l1_hint = #xegpu.cache_hint <cached >, l2_hint = #xegpu.cache_hint <uncached >}>: !xegpu.tensor_desc <16 x16 xf16 >
@@ -214,12 +214,12 @@ gpu.func @test_prefetch_2d(%arg0: memref<256x256xf16>){
214214}
215215
216216// -----
217- // CHECK-LABEL: gpu.func @test_prefetch_1d
217+ // CHECK-LABEL: gpu.func @prefetch_1d
218218// CHECK: (%[[ARG0:[0-9a-zA-Z]+]]: memref<256xf16>) {
219219// CHECK: %[[T0:.*]] = xegpu.create_nd_tdesc %[[ARG0]][%{{.*}}] : memref<256xf16> -> !xegpu.tensor_desc<16xf16>
220220// CHECK: xegpu.prefetch_nd %[[T0]] <{l1_hint = #xegpu.cache_hint<cached>, l2_hint = #xegpu.cache_hint<uncached>}> : !xegpu.tensor_desc<16xf16>
221221gpu.module @test {
222- gpu.func @test_prefetch_1d (%arg0: memref <256 xf16 >){
222+ gpu.func @prefetch_1d (%arg0: memref <256 xf16 >){
223223 %c0 = arith.constant 0 : index
224224 %0 = xegpu.create_nd_tdesc %arg0 [%c0 ] : memref <256 xf16 > -> !xegpu.tensor_desc <16 xf16 >
225225 xegpu.prefetch_nd %0 <{l1_hint = #xegpu.cache_hint <cached >, l2_hint = #xegpu.cache_hint <uncached >}>: !xegpu.tensor_desc <16 xf16 >
@@ -229,7 +229,7 @@ gpu.func @test_prefetch_1d(%arg0: memref<256xf16>){
229229
230230
231231// -----
232- // CHECK-LABEL: gpu.func @test_gemm_loop
232+ // CHECK-LABEL: gpu.func @gemm_loop
233233// CHECK: (%[[ARG0:[0-9a-zA-Z]+]]: memref<1024x1024xbf16>, %[[ARG1:[0-9a-zA-Z]+]]: memref<1024x1024xbf16>, %[[ARG2:[0-9a-zA-Z]+]]: memref<1024x1024xf32>) {
234234// CHECK: %[[BLOCK_ID_Y:.*]] = gpu.block_id y
235235// CHECK: %[[Y_COORD:.*]] = arith.muli %[[BLOCK_ID_Y]], %c16 : index
@@ -252,7 +252,7 @@ gpu.func @test_prefetch_1d(%arg0: memref<256xf16>){
252252// CHECK: %[[T9:.*]] = vector.shape_cast %[[T5]] : vector<8x1xf32> to vector<8xf32>
253253// CHECK: xegpu.store_nd %[[T9]], %[[T8]] : vector<8xf32>, !xegpu.tensor_desc<8x16xf32>
254254gpu.module @test {
255- gpu.func @test_gemm_loop (%arg0: memref <1024 x1024 xbf16 >, %arg1: memref <1024 x1024 xbf16 >, %arg2: memref <1024 x1024 xf32 >){
255+ gpu.func @gemm_loop (%arg0: memref <1024 x1024 xbf16 >, %arg1: memref <1024 x1024 xbf16 >, %arg2: memref <1024 x1024 xf32 >){
256256 %c0 = arith.constant 0 : index
257257 %c16 = arith.constant 16 : index
258258 %c8 = arith.constant 8 : index
0 commit comments