@@ -696,14 +696,14 @@ gpu.module @test_kernel {
696696 // CHECK: [[ins_0:%.+]] = vector.insert_strided_slice [[ld_0]], [[cst]] {offsets = [0, 0, 0], strides = [1]} : vector<16xf32> into vector<1x1x32xf32>
697697 // CHECK: [[ins_1:%.+]] = vector.insert_strided_slice [[ld_1]], [[ins_0]] {offsets = [0, 0, 16], strides = [1]} : vector<16xf32> into vector<1x1x32xf32>
698698 gpu.func @load_gather (%src: ui64 ) -> vector <1 x1 x32 xf32 > {
699- %cst = arith.constant dense <[[
699+ %cst = arith.constant { layout_result_0 = #xegpu.layout < inst_data = [ 1 , 1 , 16 ]>} dense <[[
700700 [0 , 8 , 16 , 24 , 32 , 40 , 48 , 56 ,
701701 64 , 72 , 80 , 88 , 96 , 104 , 112 , 120 ,
702702 128 , 136 , 144 , 152 , 160 , 168 , 176 , 184 ,
703703 192 , 200 , 208 , 216 , 224 , 232 , 240 , 248 ]
704704 ]]> : vector <1 x1 x32 xindex >
705705
706- %mask = arith.constant dense <true > : vector <1 x1 x32 xi1 >
706+ %mask = arith.constant { layout_result_0 = #xegpu.layout < inst_data = [ 1 , 1 , 16 ]>} dense <true > : vector <1 x1 x32 xi1 >
707707 %ld = xegpu.load %src [%cst ], %mask {chunk_size = 1 , layout_result_0 = #xegpu.layout <inst_data = [1 , 1 , 16 ]>, l1_hint = #xegpu.cache_hint <cached >} : ui64 , vector <1 x1 x32 xindex >, vector <1 x1 x32 xi1 > -> vector <1 x1 x32 xf32 >
708708
709709 gpu.return %ld : vector <1 x1 x32 xf32 >
@@ -751,4 +751,4 @@ gpu.module @test_kernel {
751751 xegpu.store_nd %result , %c_tdesc [%c0 , %c0 ] : vector <1 x32 xf32 >, !xegpu.tensor_desc <1 x32 xf32 , #l >
752752 gpu.return
753753 }
754- }
754+ }
0 commit comments