33//CHECK: #map = affine_map<()[s0] -> (s0 floordiv 4)>
44//CHECK: #map1 = affine_map<()[s0] -> (s0 mod 4)>
55gpu.module @test_1_1_assignment {
6- // CHECK-LABEL: test_create_nd_tdesc
6+ // CHECK-LABEL: create_nd_tdesc
77 // CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
8- gpu.func @test_create_nd_tdesc (%src: memref <24 x32 xf32 >) {
8+ gpu.func @create_nd_tdesc (%src: memref <24 x32 xf32 >) {
99 // CHECK: %[[SGID:.*]] = gpu.subgroup_id
1010 // CHECK: %[[C12:.*]] = arith.constant 12 : index
1111 // CHECK: %[[C4:.*]] = arith.constant 4 : index
@@ -30,9 +30,9 @@ gpu.module @test_1_1_assignment {
3030 gpu.return
3131 }
3232
33- // CHECK-LABEL: test_load_nd_tdesc
33+ // CHECK-LABEL: load_nd_tdesc
3434 // CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
35- gpu.func @test_load_nd_tdesc (%src: memref <24 x32 xf32 >) {
35+ gpu.func @load_nd_tdesc (%src: memref <24 x32 xf32 >) {
3636 // CHECK: %[[TDESC:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
3737 // CHECK-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
3838 // CHECK: %[[LOAD:.*]] = xegpu.load_nd %[[TDESC]]
@@ -46,9 +46,9 @@ gpu.module @test_1_1_assignment {
4646 gpu.return
4747 }
4848
49- // CHECK-LABEL: test_store_nd
49+ // CHECK-LABEL: store_nd
5050 // CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
51- gpu.func @test_store_nd (%src: memref <24 x32 xf32 >) {
51+ gpu.func @store_nd (%src: memref <24 x32 xf32 >) {
5252 // CHECK: %[[TDESC:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
5353 // CHECK-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
5454 // CHECK: %[[LOAD:.*]] = xegpu.load_nd %[[TDESC]]
@@ -66,9 +66,9 @@ gpu.module @test_1_1_assignment {
6666 gpu.return
6767}
6868
69- // CHECK-LABEL: test_update_nd
69+ // CHECK-LABEL: update_nd
7070// CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
71- gpu.func @test_update_nd (%src: memref <24 x32 xf32 >){
71+ gpu.func @update_nd (%src: memref <24 x32 xf32 >){
7272 // CHECK: %[[TDESC:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
7373 // CHECK-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
7474 // CHECK: %[[UPDATE:.*]] = xegpu.update_nd_offset %[[TDESC]], [0, 16]
@@ -80,10 +80,10 @@ gpu.func @test_update_nd(%src: memref<24x32xf32>){
8080 gpu.return
8181}
8282
83- // CHECK-LABEL: test_dpas
83+ // CHECK-LABEL: dpas
8484// CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
8585// CHECK-SAME: %[[ARG_1:.*]]: memref<32x24xf32>
86- gpu.func @test_dpas (%a: memref <24 x32 xf32 >, %b: memref <32 x24 xf32 >) {
86+ gpu.func @dpas (%a: memref <24 x32 xf32 >, %b: memref <32 x24 xf32 >) {
8787 // CHECK: %[[TDESC_A:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
8888 // CHECk-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
8989 // CHECK: %[[LOAD_A:.*]] = xegpu.load_nd %[[TDESC_A]]
@@ -114,10 +114,10 @@ gpu.func @test_dpas(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
114114 }
115115
116116
117- // CHECK-LABEL: test_dpas_no_sg_data
117+ // CHECK-LABEL: dpas_no_sg_data
118118// CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
119119// CHECK-SAME: %[[ARG_1:.*]]: memref<32x24xf32>
120- gpu.func @test_dpas_no_sg_data (%a: memref <24 x32 xf32 >, %b: memref <32 x24 xf32 >) {
120+ gpu.func @dpas_no_sg_data (%a: memref <24 x32 xf32 >, %b: memref <32 x24 xf32 >) {
121121 // CHECK: %[[TDESC_A:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
122122 // CHECk-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
123123 // CHECK: %[[LOAD_A:.*]] = xegpu.load_nd %[[TDESC_A]]
@@ -147,9 +147,9 @@ gpu.func @test_dpas_no_sg_data(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
147147 gpu.return
148148 }
149149
150- // CHECK-LABEL: test_prefetch_nd_tdesc
150+ // CHECK-LABEL: prefetch_nd_tdesc
151151 // CHECK-SAME: %[[ARG_0:.*]]: memref<24x32xf32>
152- gpu.func @test_prefetch_nd_tdesc (%src: memref <24 x32 xf32 >) {
152+ gpu.func @prefetch_nd_tdesc (%src: memref <24 x32 xf32 >) {
153153 // CHECK: %[[TDESC:.*]] = xegpu.create_nd_tdesc %[[ARG_0]][{{%.*}}, {{%.*}}] : memref<24x32xf32>
154154 // CHECK-SAME: -> !xegpu.tensor_desc<12x8xf32, #xegpu.layout<lane_layout = [2, 8], lane_data = [1, 1]>>
155155 // CHECK: xegpu.prefetch_nd %[[TDESC]]
@@ -161,16 +161,16 @@ gpu.func @test_dpas_no_sg_data(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
161161 gpu.return
162162 }
163163
164- // CHECK-LABEL: test_dpas_with_no_create_nd_desc
165- gpu.func @test_dpas_with_no_create_nd_desc (%a: vector <24 x32 xf32 >, %b: vector <32 x24 xf32 >) {
164+ // CHECK-LABEL: dpas_with_no_create_nd_desc
165+ gpu.func @dpas_with_no_create_nd_desc (%a: vector <24 x32 xf32 >, %b: vector <32 x24 xf32 >) {
166166 // CHECK-NOT: vector<12x12xf32>
167167 %dpas = xegpu.dpas %a , %b
168168 {layout = #xegpu.layout <sg_layout = [2 , 2 ], sg_data = [12 , 12 ], lane_layout = [2 , 2 ], lane_data = [1 , 1 ]>}
169169 : vector <24 x32 xf32 >, vector <32 x24 xf32 > -> vector <24 x24 xf32 >
170170 gpu.return
171171 }
172172
173- gpu.func @test_scf_for (%arg0: memref <1024 x1024 xf16 >, %arg1: memref <1024 x1024 xf16 >, %arg2: memref <1024 x1024 xf32 >) {
173+ gpu.func @scf_for (%arg0: memref <1024 x1024 xf16 >, %arg1: memref <1024 x1024 xf16 >, %arg2: memref <1024 x1024 xf32 >) {
174174 //CHECK: [[c0:%.+]] = arith.constant 0 : index
175175 //CHECK: [[c128:%.+]] = arith.constant 128 : index
176176 //CHECK: [[c1024:%.+]] = arith.constant 1024 : index
@@ -213,7 +213,7 @@ gpu.func @test_dpas_no_sg_data(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
213213 gpu.return
214214 }
215215
216- gpu.func @test_scf_while_and_condition (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
216+ gpu.func @scf_while_and_condition (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
217217 %c1_i32 = arith.constant 1 : i32
218218 %c10_i32 = arith.constant 10 : i32
219219 %c0_i32 = arith.constant 0 : i32
@@ -238,7 +238,7 @@ gpu.func @test_dpas_no_sg_data(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
238238 gpu.return
239239 }
240240
241- gpu.func @test_scf_if (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
241+ gpu.func @scf_if (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
242242 %c10 = arith.constant 10 : index
243243 %id = gpu.subgroup_id : index
244244
@@ -267,7 +267,7 @@ gpu.func @test_dpas_no_sg_data(%a: memref<24x32xf32>, %b: memref<32x24xf32>) {
267267 gpu.return
268268 }
269269
270- gpu.func @test_scf_if_tensor_desc (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
270+ gpu.func @scf_if_tensor_desc (%arg0: memref <1024 xf32 >, %arg1: memref <1024 xf32 >) {
271271 %c10 = arith.constant 10 : index
272272 %id = gpu.subgroup_id : index
273273
0 commit comments