66func.func @vector_transfer_ops_0d_memref (%mem: memref <f32 >, %vec: vector <1 x1 x1 xf32 >) {
77 %f0 = arith.constant 0.0 : f32
88
9- // CHECK-NEXT: %[[S:.*]] = memref.load %[[MEM]][] : memref<f32>
10- // CHECK-NEXT: %[[V:.*]] = vector.broadcast %[[S]] : f32 to vector<f32>
9+ // CHECK-NEXT: %[[S:.*]] = vector.load %[[MEM]][] : memref<f32>, vector<f32>
1110 %0 = vector.transfer_read %mem [], %f0 : memref <f32 >, vector <f32 >
1211
13- // CHECK-NEXT: %[[SS:.*]] = vector.extractelement %[[V]][] : vector<f32>
14- // CHECK-NEXT: memref.store %[[SS]], %[[MEM]][] : memref<f32>
12+ // CHECK-NEXT: vector.store %[[S]], %[[MEM]][] : memref<f32>, vector<f32>
1513 vector.transfer_write %0 , %mem [] : vector <f32 >, memref <f32 >
1614
17- // CHECK-NEXT: %[[VV:.*]] = vector.extract %arg1[0, 0, 0] : f32 from vector<1x1x1xf32>
18- // CHECK-NEXT: memref.store %[[VV]], %[[MEM]][] : memref<f32>
15+ // CHECK-NEXT: vector.store %[[VEC]], %[[MEM]][] : memref<f32>, vector<1x1x1xf32>
1916 vector.store %vec , %mem [] : memref <f32 >, vector <1 x1 x1 xf32 >
2017
2118 return
@@ -191,8 +188,8 @@ func.func @transfer_perm_map(%mem : memref<8x8xf32>, %idx : index) -> vector<4xf
191188// CHECK-LABEL: func @transfer_broadcasting(
192189// CHECK-SAME: %[[MEM:.*]]: memref<8x8xf32>,
193190// CHECK-SAME: %[[IDX:.*]]: index) -> vector<4xf32> {
194- // CHECK-NEXT: %[[LOAD:.*]] = memref.load %[[MEM]][%[[IDX]], %[[IDX]]] : memref<8x8xf32>
195- // CHECK-NEXT: %[[RES:.*]] = vector.broadcast %[[LOAD]] : f32 to vector<4xf32>
191+ // CHECK-NEXT: %[[LOAD:.*]] = vector.load %[[MEM]][%[[IDX]], %[[IDX]]] : memref<8x8xf32>, vector<1xf32>
192+ // CHECK-NEXT: %[[RES:.*]] = vector.broadcast %[[LOAD]] : vector<1xf32> to vector<4xf32>
196193// CHECK-NEXT: return %[[RES]] : vector<4xf32>
197194// CHECK-NEXT: }
198195
@@ -208,8 +205,7 @@ func.func @transfer_broadcasting(%mem : memref<8x8xf32>, %idx : index) -> vector
208205// CHECK-LABEL: func @transfer_scalar(
209206// CHECK-SAME: %[[MEM:.*]]: memref<?x?xf32>,
210207// CHECK-SAME: %[[IDX:.*]]: index) -> vector<1xf32> {
211- // CHECK-NEXT: %[[LOAD:.*]] = memref.load %[[MEM]][%[[IDX]], %[[IDX]]] : memref<?x?xf32>
212- // CHECK-NEXT: %[[RES:.*]] = vector.broadcast %[[LOAD]] : f32 to vector<1xf32>
208+ // CHECK-NEXT: %[[RES:.*]] = vector.load %[[MEM]][%[[IDX]], %[[IDX]]] : memref<?x?xf32>, vector<1xf32>
213209// CHECK-NEXT: return %[[RES]] : vector<1xf32>
214210// CHECK-NEXT: }
215211func.func @transfer_scalar (%mem : memref <?x?xf32 >, %idx : index ) -> vector <1 xf32 > {
@@ -222,8 +218,8 @@ func.func @transfer_scalar(%mem : memref<?x?xf32>, %idx : index) -> vector<1xf32
222218// CHECK-LABEL: func @transfer_broadcasting_2D(
223219// CHECK-SAME: %[[MEM:.*]]: memref<8x8xf32>,
224220// CHECK-SAME: %[[IDX:.*]]: index) -> vector<4x4xf32> {
225- // CHECK-NEXT: %[[LOAD:.*]] = memref.load %[[MEM]][%[[IDX]], %[[IDX]]] : memref<8x8xf32>
226- // CHECK-NEXT: %[[RES:.*]] = vector.broadcast %[[LOAD]] : f32 to vector<4x4xf32>
221+ // CHECK-NEXT: %[[LOAD:.*]] = vector.load %[[MEM]][%[[IDX]], %[[IDX]]] : memref<8x8xf32>, vector<1x1xf32>
222+ // CHECK-NEXT: %[[RES:.*]] = vector.broadcast %[[LOAD]] : vector<1x1xf32> to vector<4x4xf32>
227223// CHECK-NEXT: return %[[RES]] : vector<4x4xf32>
228224// CHECK-NEXT: }
229225
@@ -322,8 +318,8 @@ func.func @transfer_read_permutations(%mem_0 : memref<?x?xf32>, %mem_1 : memref<
322318// CHECK: vector.transpose %{{.*}}, [2, 1, 3, 0] : vector<16x14x7x8xf32> to vector<7x14x8x16xf32>
323319
324320 %6 = vector.transfer_read %mem_0 [%c0 , %c0 ], %cst {in_bounds = [true ], permutation_map = #map6 } : memref <?x?xf32 >, vector <8 xf32 >
325- // CHECK: memref.load %{{.*}}[%[[C0]], %[[C0]]] : memref<?x?xf32>
326- // CHECK: vector.broadcast %{{.*}} : f32 to vector<8xf32>
321+ // CHECK: vector.load %{{.*}}[%[[C0]], %[[C0]]] : memref<?x?xf32>, vector<1xf32>
322+ // CHECK: vector.broadcast %{{.*}} : vector<1xf32> to vector<8xf32>
327323
328324 return %0 , %1 , %2 , %3 , %4 , %5 , %6 : vector <7 x14 x8 x16 xf32 >, vector <7 x14 x8 x16 xf32 >,
329325 vector <7 x14 x8 x16 xf32 >, vector <7 x14 x8 x16 xf32 >, vector <7 x14 x8 x16 xf32 >,
0 commit comments