@@ -190,26 +190,25 @@ gpu.module @test {
190190
191191//-----
192192
193- // CHECK-LABEL: test_load
194- // CHECK-SAME: [[arg0:%.+]]: ui64
195- // CHECK-COUNT-2: xegpu.create_tdesc [[arg0]], {{.*}} : ui64, vector<16xindex> -> !xegpu.tensor_desc<16xf32, #xegpu.scatter_tdesc_attr<>>
196- // CHECK-COUNT-2: xegpu.load {{.*}} : !xegpu.tensor_desc<16xf32, #xegpu.scatter_tdesc_attr<>>, vector<16xi1> -> vector<16xf32>
197- gpu.func @test_load (%src: ui64 ) -> vector <32 xf32 > {
198- %cst = arith.constant dense <[
199- 0 , 8 , 16 , 24 , 32 , 40 , 48 , 56 ,
200- 64 , 72 , 80 , 88 , 96 , 104 , 112 , 120 ,
201- 128 , 136 , 144 , 152 , 160 , 168 , 176 , 184 ,
202- 192 , 200 , 208 , 216 , 224 , 232 , 240 , 248
203- ]> : vector <32 xindex >
193+ // CHECK-LABEL: test_load
194+ // CHECK-SAME: [[arg0:%.+]]: ui64
195+ // CHECK-COUNT-2: xegpu.create_tdesc [[arg0]], {{.*}} : ui64, vector<16xindex> -> !xegpu.tensor_desc<16xf32, #xegpu.scatter_tdesc_attr<>>
196+ // CHECK-COUNT-2: xegpu.load {{.*}} : !xegpu.tensor_desc<16xf32, #xegpu.scatter_tdesc_attr<>>, vector<16xi1> -> vector<16xf32>
197+ gpu.func @test_load (%src: ui64 ) -> vector <32 xf32 > {
198+ %cst = arith.constant dense <[
199+ 0 , 8 , 16 , 24 , 32 , 40 , 48 , 56 ,
200+ 64 , 72 , 80 , 88 , 96 , 104 , 112 , 120 ,
201+ 128 , 136 , 144 , 152 , 160 , 168 , 176 , 184 ,
202+ 192 , 200 , 208 , 216 , 224 , 232 , 240 , 248
203+ ]> : vector <32 xindex >
204204
205- %c17 = arith.constant 17 : index
206- %mask = vector.create_mask %c17: vector <32 xi1 >
207-
208- %tdesc = xegpu.create_tdesc %src , %cst : ui64 , vector <32 xindex > -> !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>
209- %ld = xegpu.load %tdesc , %mask: !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>, vector <32 xi1 > -> vector <32 xf32 >
205+ %c17 = arith.constant 17 : index
206+ %mask = vector.create_mask %c17: vector <32 xi1 >
207+ %tdesc = xegpu.create_tdesc %src , %cst : ui64 , vector <32 xindex > -> !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>
208+ %ld = xegpu.load %tdesc , %mask: !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>, vector <32 xi1 > -> vector <32 xf32 >
210209
211- gpu.return %ld : vector <32 xf32 >
212- }
210+ gpu.return %ld : vector <32 xf32 >
211+ }
213212
214213//-----
215214
@@ -219,17 +218,17 @@ gpu.module @test {
219218 // CHECK-COUNT-2: xegpu.prefetch {{.*}} : !xegpu.tensor_desc<16xf32, #xegpu.scatter_tdesc_attr<>>
220219 gpu.func @test_prefetch (%src: ui64 ) {
221220
222- %cst = arith.constant dense <[
223- 0 , 8 , 16 , 24 , 32 , 40 , 48 , 56 ,
224- 64 , 72 , 80 , 88 , 96 , 104 , 112 , 120 ,
225- 128 , 136 , 144 , 152 , 160 , 168 , 176 , 184 ,
226- 192 , 200 , 208 , 216 , 224 , 232 , 240 , 248
227- ]> : vector <32 xindex >
221+ %cst = arith.constant dense <[
222+ 0 , 8 , 16 , 24 , 32 , 40 , 48 , 56 ,
223+ 64 , 72 , 80 , 88 , 96 , 104 , 112 , 120 ,
224+ 128 , 136 , 144 , 152 , 160 , 168 , 176 , 184 ,
225+ 192 , 200 , 208 , 216 , 224 , 232 , 240 , 248
226+ ]> : vector <32 xindex >
228227
229- %tdesc = xegpu.create_tdesc %src , %cst : ui64 , vector <32 xindex > -> !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>
228+ %tdesc = xegpu.create_tdesc %src , %cst : ui64 , vector <32 xindex > -> !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>
230229
231- xegpu.prefetch %tdesc: !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>
232- gpu.return
230+ xegpu.prefetch %tdesc: !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>
231+ gpu.return
233232 }
234233
235234//-----
@@ -249,7 +248,7 @@ gpu.module @test {
249248 %c17 = arith.constant 17 : index
250249 %mask = vector.create_mask %c17: vector <32 xi1 >
251250
252- %st_vec = arith.constant dense <1023. >: vector <32 xf32 >
251+ %st_vec = arith.constant dense <1023.0 >: vector <32 xf32 >
253252 %tdesc = xegpu.create_tdesc %src , %cst : ui64 , vector <32 xindex > -> !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>
254253 xegpu.store %st_vec , %tdesc , %mask: vector <32 xf32 >, !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>, vector <32 xi1 >
255254
@@ -268,37 +267,36 @@ gpu.module @test {
268267
269268 gpu.func @test_prefetch_load_store_update (%src: ui64 ) {
270269
271- %cst = arith.constant dense <[
272- 0 , 8 , 16 , 24 , 32 , 40 , 48 , 56 ,
273- 64 , 72 , 80 , 88 , 96 , 104 , 112 , 120 ,
274- 128 , 136 , 144 , 152 , 160 , 168 , 176 , 184 ,
275- 192 , 200 , 208 , 216 , 224 , 232 , 240 , 248
276- ]> : vector <32 xindex >
277-
278- %tdesc = xegpu.create_tdesc %src , %cst : ui64 , vector <32 xindex > -> !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>
270+ %cst = arith.constant dense <[
271+ 0 , 8 , 16 , 24 , 32 , 40 , 48 , 56 ,
272+ 64 , 72 , 80 , 88 , 96 , 104 , 112 , 120 ,
273+ 128 , 136 , 144 , 152 , 160 , 168 , 176 , 184 ,
274+ 192 , 200 , 208 , 216 , 224 , 232 , 240 , 248
275+ ]> : vector <32 xindex >
279276
280- xegpu.prefetch %tdesc: !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>
277+ %tdesc = xegpu.create_tdesc %src , %cst : ui64 , vector <32 xindex > -> !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>
278+ xegpu.prefetch %tdesc: !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>
281279
282- %delta = arith.constant dense <[
283- 32 , 32 , 32 , 32 , 32 , 32 , 32 , 32 ,
284- 32 , 32 , 32 , 32 , 32 , 32 , 32 , 64 ,
285- 128 , 128 , 128 , 128 , 128 , 128 , 128 , 128 ,
286- 128 , 128 , 128 , 128 , 128 , 128 , 128 , 256
287- ]> : vector <32 xindex >
288- %new_tdesc = xegpu.update_offset %tdesc , %delta
289- : !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>, vector <32 xindex >
280+ %delta = arith.constant dense <[
281+ 32 , 32 , 32 , 32 , 32 , 32 , 32 , 32 ,
282+ 32 , 32 , 32 , 32 , 32 , 32 , 32 , 64 ,
283+ 128 , 128 , 128 , 128 , 128 , 128 , 128 , 128 ,
284+ 128 , 128 , 128 , 128 , 128 , 128 , 128 , 256
285+ ]> : vector <32 xindex >
286+ %new_tdesc = xegpu.update_offset %tdesc , %delta
287+ : !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>, vector <32 xindex >
290288
291- %c17 = arith.constant 17 : index
292- %mask = vector.create_mask %c17: vector <32 xi1 >
289+ %c17 = arith.constant 17 : index
290+ %mask = vector.create_mask %c17: vector <32 xi1 >
293291
294- %ld_vec = xegpu.load %new_tdesc , %mask: !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>, vector <32 xi1 > -> vector <32 xf32 >
292+ %ld_vec = xegpu.load %new_tdesc , %mask: !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>, vector <32 xi1 > -> vector <32 xf32 >
295293
296- %st_vec = arith.addf %ld_vec , %ld_vec : vector <32 xf32 >
297- xegpu.store %st_vec , %tdesc , %mask:
294+ %st_vec = arith.addf %ld_vec , %ld_vec : vector <32 xf32 >
295+ xegpu.store %st_vec , %tdesc , %mask:
298296 vector <32 xf32 >,
299297 !xegpu.tensor_desc <32 xf32 , #xegpu.scatter_tdesc_attr <>, #xegpu.layout <inst_data = [16 ]>>,
300298 vector <32 xi1 >
301299
302- gpu.return
303- }
300+ gpu.return
301+ }
304302}
0 commit comments