@@ -46,33 +46,3 @@ func.func @genbool_var_1d_scalable(%arg0: index) -> vector<[11]xi1> {
4646 %0 = vector.create_mask %arg0 : vector <[11 ]xi1 >
4747 return %0 : vector <[11 ]xi1 >
4848}
49-
50- // CMP32-LABEL: @transfer_read_1d
51- // CMP32: %[[MEM:.*]]: memref<?xf32>, %[[OFF:.*]]: index) -> vector<16xf32> {
52- // CMP32: %[[D:.*]] = memref.dim %[[MEM]], %{{.*}} : memref<?xf32>
53- // CMP32: %[[S:.*]] = arith.subi %[[D]], %[[OFF]] : index
54- // CMP32: %[[C:.*]] = arith.constant dense<[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]> : vector<16xi32>
55- // CMP32: %[[B:.*]] = arith.index_cast %[[S]] : index to i32
56- // CMP32: %[[B0:.*]] = llvm.insertelement %[[B]], %{{.*}} : vector<16xi32>
57- // CMP32: %[[BV:.*]] = llvm.shufflevector %[[B0]], {{.*}} : vector<16xi32>
58- // CMP32: %[[M:.*]] = arith.cmpi slt, %[[C]], %[[BV]] : vector<16xi32>
59- // CMP32: %[[L:.*]] = llvm.intr.masked.load %{{.*}}, %[[M]], %{{.*}}
60- // CMP32: return %[[L]] : vector<16xf32>
61-
62- // CMP64-LABEL: @transfer_read_1d(
63- // CMP64: %[[MEM:.*]]: memref<?xf32>, %[[OFF:.*]]: index) -> vector<16xf32> {
64- // CMP64: %[[D:.*]] = memref.dim %[[MEM]], %{{.*}} : memref<?xf32>
65- // CMP64: %[[S:.*]] = arith.subi %[[D]], %[[OFF]] : index
66- // CMP64: %[[C:.*]] = arith.constant dense<[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]> : vector<16xi64>
67- // CMP64: %[[B:.*]] = arith.index_cast %[[S]] : index to i64
68- // CMP64: %[[B0:.*]] = llvm.insertelement %[[B]], %{{.*}} : vector<16xi64>
69- // CMP64: %[[BV:.*]] = llvm.shufflevector %[[B0]], {{.*}} : vector<16xi64>
70- // CMP64: %[[M:.*]] = arith.cmpi slt, %[[C]], %[[BV]] : vector<16xi64>
71- // CMP64: %[[L:.*]] = llvm.intr.masked.load %{{.*}}, %[[M]], %{{.*}}
72- // CMP64: return %[[L]] : vector<16xf32>
73-
74- func.func @transfer_read_1d (%A : memref <?xf32 >, %i: index ) -> vector <16 xf32 > {
75- %d = arith.constant -1.0 : f32
76- %f = vector.transfer_read %A [%i ], %d {permutation_map = affine_map <(d0 ) -> (d0 )>} : memref <?xf32 >, vector <16 xf32 >
77- return %f : vector <16 xf32 >
78- }
0 commit comments