@@ -370,31 +370,31 @@ gpu.module @test_distribution {
370370 // CHECK-LABEL: vector_step_op
371371 gpu.func @vector_step_op_slice_attr () {
372372 //CHECK: [[sgId:%.+]] = gpu.subgroup_id : index
373- //CHECK: [[IDY:%.+]] = affine.apply #map2()[[[sgId]]]
374- //CHECK: [[c32:%.+]] = arith.constant 32 : index
375- //CHECK: [[LOCALY:%.+]] = index.mul [[IDY]], [[c32]]
376- //CHECK: [[c0:%.+]] = arith.constant 0 : index
377- //CHECK: [[Y:%.+]] = arith.addi [[LOCALY]], [[c0]] : index
378- //CHECK: [[c128:%.+]] = arith.constant 128 : index
379- //CHECK: [[MODY:%.+]] = index.remu [[Y]], [[c128]]
380- //CHECK: [[BASE:%.+]] = vector.step : vector<32xindex>
381- //CHECK: [[CAST:%.+]] = vector.broadcast [[MODY]] : index to vector<32xindex>
373+ //CHECK-DAG: [[IDY:%.+]] = affine.apply #map2()[[[sgId]]]
374+ //CHECK-DAG: [[c32:%.+]] = arith.constant 32 : index
375+ //CHECK-DAG: [[LOCALY:%.+]] = index.mul [[IDY]], [[c32]]
376+ //CHECK-DAG: [[c0:%.+]] = arith.constant 0 : index
377+ //CHECK-DAG: [[Y:%.+]] = arith.addi [[LOCALY]], [[c0]] : index
378+ //CHECK-DAG: [[c128:%.+]] = arith.constant 128 : index
379+ //CHECK-DAG: [[MODY:%.+]] = index.remu [[Y]], [[c128]]
380+ //CHECK-DAG: [[BASE:%.+]] = vector.step : vector<32xindex>
381+ //CHECK-DAG: [[CAST:%.+]] = vector.broadcast [[MODY]] : index to vector<32xindex>
382382 //CHECK: [[ADD:%.+]] = arith.addi [[BASE]], [[CAST]] : vector<32xindex>
383383 %step = vector.step {layout_result_0 = #xegpu.slice <#xegpu.layout <sg_layout = [4 , 8 ], sg_data = [32 , 32 ]>, dims = [1 ]>}: vector <128 xindex >
384384 gpu.return
385385 }
386386
387387 gpu.func @vector_step_op_layout_attr () {
388388 //CHECK: [[sgId:%.+]] = gpu.subgroup_id : index
389- //CHECK: [[c16:%.+]] = arith.constant 16 : index
390- //CHECK: [[c8:%.+]] = arith.constant 8 : index
391- //CHECK: [[LOCALY:%.+]] = index.mul [[sgId]], [[c8]]
392- //CHECK: [[c0:%.+]] = arith.constant 0 : index
393- //CHECK: [[Y:%.+]] = arith.addi [[LOCALY]], [[c0]] : index
394- //CHECK: [[c128:%.+]] = arith.constant 128 : index
395- //CHECK: [[MODY:%.+]] = index.remu [[Y]], [[c128]]
396- //CHECK: [[BASE:%.+]] = vector.step : vector<8xindex>
397- //CHECK: [[CAST:%.+]] = vector.broadcast [[MODY]] : index to vector<8xindex>
389+ //CHECK-DAG: [[c16:%.+]] = arith.constant 16 : index
390+ //CHECK-DAG: [[c8:%.+]] = arith.constant 8 : index
391+ //CHECK-DAG: [[LOCALY:%.+]] = index.mul [[sgId]], [[c8]]
392+ //CHECK-DAG: [[c0:%.+]] = arith.constant 0 : index
393+ //CHECK-DAG: [[Y:%.+]] = arith.addi [[LOCALY]], [[c0]] : index
394+ //CHECK-DAG: [[c128:%.+]] = arith.constant 128 : index
395+ //CHECK-DAG: [[MODY:%.+]] = index.remu [[Y]], [[c128]]
396+ //CHECK-DAG: [[BASE:%.+]] = vector.step : vector<8xindex>
397+ //CHECK-DAG: [[CAST:%.+]] = vector.broadcast [[MODY]] : index to vector<8xindex>
398398 //CHECK: [[ADD:%.+]] = arith.addi [[BASE]], [[CAST]] : vector<8xindex>
399399 %step = vector.step {layout_result_0 = #xegpu.layout <sg_layout = [16 ], sg_data = [8 ]>}: vector <128 xindex >
400400 gpu.return
@@ -414,8 +414,8 @@ gpu.module @test_distribution {
414414 %load = xegpu.load_nd %tdesc [0 , 0 ]
415415 : !xegpu.tensor_desc <256 x128 xf32 , #xegpu.layout <sg_layout = [8 , 4 ], sg_data = [32 , 32 ], lane_layout = [1 , 16 ], lane_data = [1 , 1 ]>>
416416 -> vector <256 x128 xf32 >
417- //CHECK: vector.shape_cast {{.*}} : vector<32x32xf32> to vector<8x4x8x4xf32 >
418- %cast = vector.shape_cast %load {layout_result_0 = #xegpu.layout <sg_layout = [2 , 4 , 2 , 2 ], sg_data = [8 , 4 , 8 , 4 ]>} : vector <256 x128 xf32 > to vector <16 x16 x16 x8 xf32 >
417+ //CHECK: vector.shape_cast {{.*}} : vector<32x32xf32> to vector<2x16x4x8xf32>
418+ %cast = vector.shape_cast %load {layout_result_0 = #xegpu.layout <sg_layout = [8 , 1 , 4 , 1 ], sg_data = [2 , 16 , 4 , 8 ]>} : vector <256 x128 xf32 > to vector <16 x16 x16 x8 xf32 >
419419 gpu.return
420420 }
421421}
0 commit comments