@@ -11,7 +11,7 @@ func.func @matmul_riscv(%lhs: tensor<384x512xf32>, %rhs: tensor<512x128xf32>) ->
1111 %2 = linalg.matmul ins (%lhs , %rhs : tensor <384 x512 xf32 >, tensor <512 x128 xf32 >) outs (%1 : tensor <384 x128 xf32 >) -> tensor <384 x128 xf32 >
1212 return %2 : tensor <384 x128 xf32 >
1313}
14- // CHECK-DAG: #[[CONFIG:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[48, 64], [8, 32], [0, 0], [0, 0]]>
14+ // CHECK-DAG: #[[CONFIG:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[48, 64], [48, 64], [0, 0], [ 8, 32], [0, 0], [0, 0]]>
1515// CHECK-DAG: #[[CONFIG2:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[48, 64, 0], [48, 64, 0], [0, 0, 0], [8, 32, 0], [0, 0, 1], [0, 0, 0]]>
1616// CHECK-DAG: #[[TRANSLATION:.+]] = #iree_codegen.translation_info<pipeline = CPUDoubleTilingExpert, {{\{}}enable_loop_peeling}>
1717// CHECK: func.func @matmul_riscv(
@@ -31,7 +31,7 @@ func.func @matmul_gemm_riscv_vl512(%lhs: tensor<384x512xf32>, %rhs: tensor<512x1
3131 %res = linalg.matmul ins (%lhs , %rhs : tensor <384 x512 xf32 >, tensor <512 x128 xf32 >) outs (%fill : tensor <384 x128 xf32 >) -> tensor <384 x128 xf32 >
3232 return %res : tensor <384 x128 xf32 >
3333}
34- // CHECK-DAG: #[[CONFIG:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[64, 64], [7, 64], [0, 0], [0, 0]]>
34+ // CHECK-DAG: #[[CONFIG:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[64, 64], [64, 64], [0, 0], [ 7, 64], [0, 0], [0, 0]]>
3535// CHECK-DAG: #[[CONFIG2:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[64, 64, 0], [64, 64, 0], [0, 0, 0], [7, 64, 0], [0, 0, 1], [0, 0, 0]]>
3636// CHECK-DAG: #[[TRANSLATION:.+]] = #iree_codegen.translation_info<pipeline = CPUDoubleTilingExpert, {{\{}}enable_loop_peeling}>
3737// CHECK: func.func @matmul_gemm_riscv_vl512(
@@ -51,15 +51,15 @@ func.func @matmul_gemm_riscv_vl1024(%lhs: tensor<384x512xf32>, %rhs: tensor<512x
5151 %res = linalg.matmul ins (%lhs , %rhs : tensor <384 x512 xf32 >, tensor <512 x256 xf32 >) outs (%fill : tensor <384 x256 xf32 >) -> tensor <384 x256 xf32 >
5252 return %res : tensor <384 x256 xf32 >
5353}
54- // CHECK-DAG: #[[CONFIG:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[64, 128], [7, 128], [0, 0], [0, 0]]>
54+ // CHECK-DAG: #[[CONFIG:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[64, 128], [64, 128], [0, 0], [ 7, 128], [0, 0], [0, 0]]>
5555// CHECK-DAG: #[[CONFIG2:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[64, 128, 0], [64, 128, 0], [0, 0, 0], [7, 128, 0], [0, 0, 1], [0, 0, 0]]>
5656// CHECK-DAG: #[[TRANSLATION:.+]] = #iree_codegen.translation_info<pipeline = CPUDoubleTilingExpert, {{\{}}enable_loop_peeling}>
5757// CHECK: func.func @matmul_gemm_riscv_vl1024(
5858// CHECK-SAME: translation_info = #[[TRANSLATION]]
5959// CHECK: linalg.matmul
6060// CHECK-SAME: lowering_config = #[[CONFIG2]]
6161
62- // CHECK-AGGRESSIVE-DAG: #[[CONFIG:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[32, 256], [7, 128], [0, 0], [0, 0]]>
62+ // CHECK-AGGRESSIVE-DAG: #[[CONFIG:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[32, 256], [32, 256], [0, 0], [ 7, 128], [0, 0], [0, 0]]>
6363// CHECK-AGGRESSIVE-DAG: #[[CONFIG2:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[32, 256, 0], [32, 256, 0], [0, 0, 0], [7, 128, 0], [0, 0, 1], [0, 0, 0]]>
6464// CHECK-AGGRESSIVE-DAG: #[[TRANSLATION:.+]] = #iree_codegen.translation_info<pipeline = CPUDoubleTilingExpert, {{\{}}enable_loop_peeling}>
6565// CHECK-AGGRESSIVE: func.func @matmul_gemm_riscv_vl1024(
@@ -79,7 +79,7 @@ func.func @matmul_gemv_riscv_vl512(%lhs: tensor<1x512xf32>, %rhs: tensor<512x128
7979 %res = linalg.matmul ins (%lhs , %rhs : tensor <1 x512 xf32 >, tensor <512 x128 xf32 >) outs (%fill : tensor <1 x128 xf32 >) -> tensor <1 x128 xf32 >
8080 return %res : tensor <1 x128 xf32 >
8181}
82- // CHECK-DAG: #[[CONFIG:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[0, 128], [1, 128], [0, 0], [0, 0]]>
82+ // CHECK-DAG: #[[CONFIG:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[0, 128], [0, 128], [0, 0], [ 1, 128], [0, 0], [0, 0]]>
8383// CHECK-DAG: #[[CONFIG2:.+]] = #iree_codegen.lowering_config<tile_sizes = {{\[}}[0, 128, 0], [0, 128, 0], [0, 0, 0], [1, 128, 0], [0, 0, 1], [0, 0, 0]]>
8484// CHECK-DAG: #[[TRANSLATION:.+]] = #iree_codegen.translation_info<pipeline = CPUDoubleTilingExpert, {{\{}}enable_loop_peeling}>
8585// CHECK: func.func @matmul_gemv_riscv_vl512(
0 commit comments