Enable I8 and I1 testcases (#536)

chencha3 · web-flow · commit 9cc942fb2b5e · 2022-11-29T10:46:03.000-08:00
* add i8-to-i32 cast helper (castI8toI32) so i8 results can be printed with printMemrefI32

* enable int8 test cases

* enable LogicalAnd/LogicalNot/LogicalOr (i1) and BitNot (i8) test cases

* format fix
diff --git a/test/PlaidML/CppEdsl.BitNot.mlir b/test/PlaidML/CppEdsl.BitNot.mlir
@@ -11,11 +11,26 @@ module @bit_not {
 func.func @main() {
     %0= arith.constant dense<[[0, 1, 2], [16, 17, 34], [240, 15, 255]]>:tensor<3x3xi8>
     %1 = call @test(%0) : (tensor<3x3xi8>) -> tensor<3x3xi8>
-    %unranked = tensor.cast %1 : tensor<3x3xi8>to tensor<*xi8>
-    call @printMemrefI32(%unranked) : (tensor<*xi8>) -> ()
+    %2 = call @castI8toI32(%1): (tensor<3x3xi8>) -> tensor<3x3xi32>
+    %unranked = tensor.cast %2 : tensor<3x3xi32> to tensor<*xi32>
+    call @printMemrefI32(%unranked) : (tensor<*xi32>) -> ()
     return
 }
-func.func private @printMemrefI32(tensor<*xi8>)
+
+func.func @castI8toI32(%arg0: tensor<3x3xi8>) -> tensor<3x3xi32> {  // element-wise zero-extension of a 3x3 i8 tensor to i32
+  %init = tensor.empty() : tensor<3x3xi32>
+  %widened = linalg.generic {
+      indexing_maps = [#map, #map], iterator_types = ["parallel", "parallel"]}
+      ins(%arg0 : tensor<3x3xi8>) outs(%init : tensor<3x3xi32>)
+      attrs = {iterator_ranges = [3, 3]} {
+  ^bb0(%src: i8, %dst: i32):
+    %ext = arith.extui %src : i8 to i32  // unsigned widening: the i8 bit pattern is read as 0..255
+    linalg.yield %ext : i32
+  } -> tensor<3x3xi32>
+  return %widened : tensor<3x3xi32>
+}
+
+func.func private @printMemrefI32(tensor<*xi32>)
 func.func @test(%arg0: tensor<3x3xi8>)->tensor<3x3xi8>{
     %0 = tensor.empty() : tensor<3x3xi8>
     %1 = linalg.generic {indexing_maps = [#map, #map], iterator_types = ["parallel", "parallel"]} ins(%arg0 : tensor<3x3xi8>) outs(%0 : tensor<3x3xi8>) {
diff --git a/test/PlaidML/CppEdsl.ConvI8.mlir b/test/PlaidML/CppEdsl.ConvI8.mlir
@@ -11,7 +11,7 @@
 #map2 = affine_map<(d0, d1, d2, d3, d4, d5, d6) -> (d4, d5, d6, d3)>
 #map3 = affine_map<(d0, d1, d2, d3, d4, d5, d6) -> (d0, d1, d2, d3)>
 module @convolution {
-func.func @test(%arg0: tensor<1x224x224x3xi8>, %arg1: tensor<3x3x3x32xi8>) -> tensor<1x224x224x32xi8> {
+  func.func @test(%arg0: tensor<1x224x224x3xi8>, %arg1: tensor<3x3x3x32xi8>) -> tensor<1x224x224x32xi8> {
     %c0_i8 = arith.constant 0 : i8
     %0 = tensor.empty() : tensor<1x224x224x3xi8>
     %1 = linalg.generic {indexing_maps = [#map0, #map0], iterator_types = ["parallel", "parallel", "parallel", "parallel"]} ins(%arg0 : tensor<1x224x224x3xi8>) outs(%0 : tensor<1x224x224x3xi8>) {
@@ -33,15 +33,31 @@ func.func @test(%arg0: tensor<1x224x224x3xi8>, %arg1: tensor<3x3x3x32xi8>) -> te
     } -> tensor<1x224x224x32xi8>
     return %5 : tensor<1x224x224x32xi8>
   }
+
   func.func @main() {
     %0 = arith.constant dense<1> : tensor<1x224x224x3xi8>
     %1 = arith.constant dense<1> : tensor<3x3x3x32xi8>
     %2 = call @test(%0, %1) : (tensor<1x224x224x3xi8>, tensor<3x3x3x32xi8>) -> tensor<1x224x224x32xi8>
-    %unranked = tensor.cast %2 : tensor<1x224x224x32xi8> to tensor<*xi8>
-    call @printMemrefI8(%unranked) : (tensor<*xi8>) -> ()
+    %3 = call @castI8toI32(%2): (tensor<1x224x224x32xi8>) -> tensor<1x224x224x32xi32>
+    %unranked = tensor.cast %3 : tensor<1x224x224x32xi32> to tensor<*xi32>
+    call @printMemrefI32(%unranked) : (tensor<*xi32>) -> ()
     return
   }
-    //      CHECK: Unranked Memref base@ = {{(0x)?[-9a-f]*}}
-    // CHECK-NEXT:
-  func.func private @printMemrefI8(tensor<*xi8>)
+
+  func.func @castI8toI32(%arg0: tensor<1x224x224x32xi8>) -> tensor<1x224x224x32xi32> {  // element-wise zero-extension i8 -> i32
+    %init = tensor.empty() : tensor<1x224x224x32xi32>
+    %widened = linalg.generic {
+        indexing_maps = [#map0, #map0], iterator_types = ["parallel", "parallel", "parallel", "parallel"]}
+        ins(%arg0 : tensor<1x224x224x32xi8>) outs(%init : tensor<1x224x224x32xi32>)
+        attrs = {iterator_ranges = [1, 224, 224, 32]} {
+    ^bb0(%src: i8, %dst: i32):
+      %ext = arith.extui %src : i8 to i32  // unsigned widening: the i8 bit pattern is read as 0..255
+      linalg.yield %ext : i32
+    } -> tensor<1x224x224x32xi32>
+    return %widened : tensor<1x224x224x32xi32>
+  }
+
+  //      CHECK: Unranked Memref base@ = {{(0x)?[-9a-f]*}}
+  // CHECK-NEXT: [12, 12]
+  func.func private @printMemrefI32(tensor<*xi32>)
 }
diff --git a/test/PlaidML/OpTest.ExplicitPaddingNegInf.mlir b/test/PlaidML/OpTest.ExplicitPaddingNegInf.mlir
@@ -0,0 +1,65 @@
+// RUN: %python_executable %imex_runner -i %s --pass-pipeline-file=%p/linalg-to-cpu.pp \
+// RUN:                                       --runner mlir-cpu-runner -e main \
+// RUN:                                       --shared-libs=%mlir_runner_utils \
+// RUN:                                       --entry-point-result=void | FileCheck %s
+// RUN: %gpu_skip || %python_executable %imex_runner -i %s --pass-pipeline-file=%p/linalg-to-llvm.pp \
+// RUN:                                       --runner mlir-cpu-runner -e main \
+// RUN:                                       --entry-point-result=void \
+// RUN:                                       --shared-libs=%mlir_runner_utils,%sycl_runtime | FileCheck %s
+#map0 = affine_map<(d0, d1) -> (d0, d1)>
+#map1 = affine_map<(d0, d1) -> (d0 + 2, d1 + 1)>
+module @explicit_padding {
+  func.func private @printMemrefF32(tensor<*xf32>)  // external declaration only; no body in this file
+  func.func @test(%arg0: tensor<2x3xf32>) -> tensor<6x5xf32> {  // writes the 2x3 input at offset (2, 1) of a 6x5 tensor pre-filled with -inf
+    %zero = arith.constant 0.0 : f32
+    %neg_inf = arith.constant 0xFF800000 : f32  // IEEE-754 single-precision bit pattern of -inf
+    %empty = tensor.empty() : tensor<6x5xf32>
+    %padded = linalg.fill ins(%neg_inf : f32) outs(%empty : tensor<6x5xf32>) -> tensor<6x5xf32>
+    %result = linalg.generic {indexing_maps = [#map0, #map1], iterator_types = ["parallel", "reduction"]} ins(%arg0 : tensor<2x3xf32>) outs(%padded : tensor<6x5xf32>) attrs = {iterator_ranges = [2, 3], name = "explicit_padding"} {
+    ^bb0(%in: f32, %acc: f32):
+      %clamped = arith.maxf %zero, %acc : f32  // max(0, -inf) = 0, so the add below yields the input value
+      %sum = arith.addf %clamped, %in : f32
+      linalg.yield %sum : f32
+    } -> tensor<6x5xf32>
+    return %result : tensor<6x5xf32>
+  }
+  func.func @main() {
+    %input = arith.constant dense<[[1.0, 2.0, 3.0], [4.0, 5.0, 6.0]]> : tensor<2x3xf32>
+    %out = call @test(%input) : (tensor<2x3xf32>) -> tensor<6x5xf32>
+    %unranked = tensor.cast %out : tensor<6x5xf32> to tensor<*xf32>
+    call @printMemrefF32(%unranked) : (tensor<*xf32>) -> ()
+    return
+  }
+}
+// CHECK: Unranked Memref base@ = {{0x[0-9a-f]*}}
+// CHECK-SAME: rank = {{.}} offset = {{.}} sizes = [6, 5] strides = {{.*}} data =
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   1
+// CHECK:   2
+// CHECK:   3
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   4
+// CHECK:   5
+// CHECK:   6
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
+// CHECK:   -inf
diff --git a/test/PlaidML/OpTest.GEMM_INT32.mlir b/test/PlaidML/OpTest.GEMM_INT32.mlir
@@ -18,7 +18,7 @@ func.func @main() {
     %3 = call @test(%0,%1,%2) : (tensor<3x3xi32>,tensor<3x3xi32>,tensor<3x3xi32>) -> tensor<3x3xi32>
     %unranked = tensor.cast %3 : tensor<3x3xi32>to tensor<*xi32>
     call @printMemrefI32(%unranked) : (tensor<*xi32>) -> ()
-     // CHECK: Unranked Memref base@ = {{(0x)?[-9a-f]*}}
+    // CHECK: Unranked Memref base@ = {{(0x)?[-9a-f]*}}
     // CHECK-NEXT: [40,   43,   46]
     // CHECK-NEXT: [56,   60,   64]
     // CHECK-NEXT: [118,   127,   136]
diff --git a/test/PlaidML/OpTest.GEMM_INT8.mlir b/test/PlaidML/OpTest.GEMM_INT8.mlir
@@ -13,16 +13,34 @@
 #map3 = affine_map<(d0, d1) -> (d0, d1)>
 module @gemm {
 func.func @main() {
-    %0= arith.constant dense<[[1, 2, 3], [1, 1, 1], [1, 1, 1]]>:tensor<3x3xi8>
-    %1 = arith.constant dense<[[1, 1, 1], [1, 2, 3], [1, 1, 1]]>:tensor<3x3xi8>
+    %0= arith.constant dense<[[1, 1, 1], [1, 1, 2], [3, 3, 3]]>:tensor<3x3xi8>
+    %1 = arith.constant dense<[[10, 11, 12], [13, 14, 15], [16, 17, 18]]>:tensor<3x3xi8>
     %2= arith.constant dense<[[1, 1, 1], [1, 1, 1], [1, 2, 3]]>:tensor<3x3xi8>
     %3 = call @test(%0,%1,%2) : (tensor<3x3xi8>,tensor<3x3xi8>,tensor<3x3xi8>) -> tensor<3x3xi8>
-    %unranked = tensor.cast %3 : tensor<3x3xi8>to tensor<*xi8>
-    call @printMemrefI8(%unranked) : (tensor<*xi8>) -> ()
-    // CHECK:
+    %4 = call @castI8toI32(%3): (tensor<3x3xi8>) -> tensor<3x3xi32>
+    %unranked = tensor.cast %4 : tensor<3x3xi32>to tensor<*xi32>
+    call @printMemrefI32(%unranked) : (tensor<*xi32>) -> ()
+    // CHECK: Unranked Memref base@ = {{(0x)?[0-9a-f]*}}
+    // CHECK-NEXT: [40,   43,   46]
+    // CHECK-NEXT: [56,   60,   64]
+    // CHECK-NEXT: [118,   128,   138]
     return
 }
-func.func private @printMemrefI8(tensor<*xi8>)
+
+func.func @castI8toI32(%arg0: tensor<3x3xi8>) -> tensor<3x3xi32> {  // element-wise zero-extension of a 3x3 i8 tensor to i32
+  %init = tensor.empty() : tensor<3x3xi32>
+  %widened = linalg.generic {
+      indexing_maps = [#map3, #map3], iterator_types = ["parallel", "parallel"]}
+      ins(%arg0 : tensor<3x3xi8>) outs(%init : tensor<3x3xi32>)
+      attrs = {iterator_ranges = [3, 3]} {
+  ^bb0(%src: i8, %dst: i32):
+    %ext = arith.extui %src : i8 to i32  // unsigned widening: the i8 bit pattern is read as 0..255
+    linalg.yield %ext : i32
+  } -> tensor<3x3xi32>
+  return %widened : tensor<3x3xi32>
+}
+
+func.func private @printMemrefI32(tensor<*xi32>) attributes { llvm.emit_c_interface }
 func.func @test(%arg0: tensor<3x3xi8>, %arg1: tensor<3x3xi8>, %arg2: tensor<3x3xi8>) -> tensor<3x3xi8> {
     %c0_i8 = arith.constant 0 : i8
     %0 = tensor.empty() : tensor<3x3xi8>
diff --git a/test/PlaidML/OpTest.GEMV_INT8.mlir b/test/PlaidML/OpTest.GEMV_INT8.mlir
@@ -17,12 +17,26 @@ func.func @main() {
     %1= arith.constant dense<[1, 1, 1]>:tensor<3xi8>
     %2= arith.constant dense<[1, 1, 1]>:tensor<3xi8>
     %3 = call @test(%0,%1,%2) : (tensor<3x3xi8>,tensor<3xi8>,tensor<3xi8>) -> tensor<3xi8>
-    %unranked = tensor.cast %3 : tensor<3xi8>to tensor<*xi8>
-    call @printMemrefI8(%unranked) : (tensor<*xi8>) -> ()
-    // CHECK:
+    %4 = call @castI8toI32(%3): (tensor<3xi8>) -> tensor<3xi32>
+    %unranked = tensor.cast %4 : tensor<3xi32>to tensor<*xi32>
+    call @printMemrefI32(%unranked) : (tensor<*xi32>) -> ()
+    // CHECK: Unranked Memref base@ = {{(0x)?[0-9a-f]*}}
+    // CHECK-NEXT: [7,  4,  4]
     return
 }
-func.func private @printMemrefI8(tensor<*xi8>)
+func.func @castI8toI32(%arg0: tensor<3xi8>) -> tensor<3xi32> {  // element-wise zero-extension of a 3-element i8 tensor to i32
+  %init = tensor.empty() : tensor<3xi32>
+  %widened = linalg.generic {
+      indexing_maps = [#map3, #map3], iterator_types = ["parallel"]}
+      ins(%arg0 : tensor<3xi8>) outs(%init : tensor<3xi32>)
+      attrs = {iterator_ranges = [3]} {
+  ^bb0(%src: i8, %dst: i32):
+    %ext = arith.extui %src : i8 to i32  // unsigned widening: the i8 bit pattern is read as 0..255
+    linalg.yield %ext : i32
+  } -> tensor<3xi32>
+  return %widened : tensor<3xi32>
+}
+func.func private @printMemrefI32(tensor<*xi32>) attributes { llvm.emit_c_interface }
 func.func @test(%arg0: tensor<3x3xi8>, %arg1: tensor<3xi8>, %arg2: tensor<3xi8>) -> tensor<3xi8> {
     %c0_i8 = arith.constant 0 : i8
     %0 = tensor.empty() : tensor<3xi8>
diff --git a/test/PlaidML/OpTest.LogicalAnd_mixed.mlir b/test/PlaidML/OpTest.LogicalAnd_mixed.mlir
@@ -12,11 +12,26 @@ func.func @main() {
     %0= arith.constant dense<[[1, 2, 3], [4, 0, 6], [7, 0, 9]]>:tensor<3x3xi64>
     %1= arith.constant dense<[[10.0, 11.0, 12.0], [13.0, 14.0, 15.0], [16.0, 17.0, 18.0]]>:tensor<3x3xf32>
     %2 = call @test(%0,%1) : (tensor<3x3xi64>,tensor<3x3xf32>) -> tensor<3x3xi1>
-    %unranked = tensor.cast %2 : tensor<3x3xi1>to tensor<*xi1>
-    call @printMemrefI32(%unranked) : (tensor<*xi1>) -> ()
+    %3 = call @castI1toI32(%2): (tensor<3x3xi1>) -> tensor<3x3xi32>
+    %unranked = tensor.cast %3 : tensor<3x3xi32>to tensor<*xi32>
+    call @printMemrefI32(%unranked) : (tensor<*xi32>) -> ()
     return
 }
-func.func private @printMemrefI32(tensor<*xi1>)
+
+func.func @castI1toI32(%arg0: tensor<3x3xi1>) -> tensor<3x3xi32> {  // element-wise zero-extension of a 3x3 i1 tensor to i32
+  %init = tensor.empty() : tensor<3x3xi32>
+  %widened = linalg.generic {
+      indexing_maps = [#map, #map], iterator_types = ["parallel", "parallel"]}
+      ins(%arg0 : tensor<3x3xi1>) outs(%init : tensor<3x3xi32>)
+      attrs = {iterator_ranges = [3, 3]} {
+  ^bb0(%flag: i1, %dst: i32):
+    %ext = arith.extui %flag : i1 to i32  // zero-extension: false -> 0, true -> 1
+    linalg.yield %ext : i32
+  } -> tensor<3x3xi32>
+  return %widened : tensor<3x3xi32>
+}
+
+func.func private @printMemrefI32(tensor<*xi32>)
 func.func @test(%arg0: tensor<3x3xi64>, %arg1: tensor<3x3xf32>)->tensor<3x3xi1>{
     %0 = tensor.empty() : tensor<3x3xi1>
     %1 = linalg.generic {indexing_maps = [#map, #map, #map], iterator_types = ["parallel", "parallel"]} ins(%arg0, %arg1 : tensor<3x3xi64>, tensor<3x3xf32>) outs(%0 : tensor<3x3xi1>) {
diff --git a/test/PlaidML/OpTest.LogicalAnd_uint64.mlir b/test/PlaidML/OpTest.LogicalAnd_uint64.mlir
@@ -12,11 +12,26 @@ func.func @main() {
     %0= arith.constant dense<[[1, 2, 3], [4, 0, 6], [7, 0, 9]]>:tensor<3x3xi64>
     %1= arith.constant dense<[[10, 11, 12], [13, 14, 15], [16, 17, 18]]>:tensor<3x3xi64>
     %2 = call @test(%0,%1) : (tensor<3x3xi64>,tensor<3x3xi64>) -> tensor<3x3xi1>
-    %unranked = tensor.cast %2 : tensor<3x3xi1>to tensor<*xi1>
-    call @printMemrefI32(%unranked) : (tensor<*xi1>) -> ()
+    %3 = call @castI1toI32(%2): (tensor<3x3xi1>) -> tensor<3x3xi32>
+    %unranked = tensor.cast %3 : tensor<3x3xi32>to tensor<*xi32>
+    call @printMemrefI32(%unranked) : (tensor<*xi32>) -> ()
     return
 }
-func.func private @printMemrefI32(tensor<*xi1>)
+
+func.func @castI1toI32(%arg0: tensor<3x3xi1>) -> tensor<3x3xi32> {  // element-wise zero-extension of a 3x3 i1 tensor to i32
+  %init = tensor.empty() : tensor<3x3xi32>
+  %widened = linalg.generic {
+      indexing_maps = [#map, #map], iterator_types = ["parallel", "parallel"]}
+      ins(%arg0 : tensor<3x3xi1>) outs(%init : tensor<3x3xi32>)
+      attrs = {iterator_ranges = [3, 3]} {
+  ^bb0(%flag: i1, %dst: i32):
+    %ext = arith.extui %flag : i1 to i32  // zero-extension: false -> 0, true -> 1
+    linalg.yield %ext : i32
+  } -> tensor<3x3xi32>
+  return %widened : tensor<3x3xi32>
+}
+
+func.func private @printMemrefI32(tensor<*xi32>)
 func.func @test(%arg0: tensor<3x3xi64>, %arg1: tensor<3x3xi64>)->tensor<3x3xi1>{
     %0 = tensor.empty() : tensor<3x3xi1>
     %1 = linalg.generic {indexing_maps = [#map, #map, #map], iterator_types = ["parallel", "parallel"]} ins(%arg0, %arg1 : tensor<3x3xi64>, tensor<3x3xi64>) outs(%0 : tensor<3x3xi1>) {
diff --git a/test/PlaidML/OpTest.LogicalNot_float.mlir b/test/PlaidML/OpTest.LogicalNot_float.mlir
@@ -11,11 +11,26 @@ module @logical_not {
 func.func @main() {
     %0= arith.constant dense<[[1.0, 2.0, 3.0], [4.0, 0.0, 6.5], [7.7, 0.0, 0.9]]>:tensor<3x3xf32>
     %1 = call @test(%0) : (tensor<3x3xf32>) -> tensor<3x3xi1>
-    %unranked = tensor.cast %1 : tensor<3x3xi1>to tensor<*xi1>
-    call @printMemrefI32(%unranked) : (tensor<*xi1>) -> ()
+    %2 = call @castI1toI32(%1): (tensor<3x3xi1>) -> tensor<3x3xi32>
+    %unranked = tensor.cast %2 : tensor<3x3xi32>to tensor<*xi32>
+    call @printMemrefI32(%unranked) : (tensor<*xi32>) -> ()
     return
 }
-func.func private @printMemrefI32(tensor<*xi1>)
+
+func.func @castI1toI32(%arg0: tensor<3x3xi1>) -> tensor<3x3xi32> {  // element-wise zero-extension of a 3x3 i1 tensor to i32
+  %init = tensor.empty() : tensor<3x3xi32>
+  %widened = linalg.generic {
+      indexing_maps = [#map, #map], iterator_types = ["parallel", "parallel"]}
+      ins(%arg0 : tensor<3x3xi1>) outs(%init : tensor<3x3xi32>)
+      attrs = {iterator_ranges = [3, 3]} {
+  ^bb0(%flag: i1, %dst: i32):
+    %ext = arith.extui %flag : i1 to i32  // zero-extension: false -> 0, true -> 1
+    linalg.yield %ext : i32
+  } -> tensor<3x3xi32>
+  return %widened : tensor<3x3xi32>
+}
+
+func.func private @printMemrefI32(tensor<*xi32>)
 func.func @test(%arg0: tensor<3x3xf32>)->tensor<3x3xi1>{
     %0 = tensor.empty() : tensor<3x3xi1>
     %1 = linalg.generic {indexing_maps = [#map, #map], iterator_types = ["parallel", "parallel"]} ins(%arg0 : tensor<3x3xf32>) outs(%0 : tensor<3x3xi1>) {
diff --git a/test/PlaidML/OpTest.LogicalNot_int32.mlir b/test/PlaidML/OpTest.LogicalNot_int32.mlir
@@ -11,11 +11,26 @@ module @logical_not {
 func.func @main() {
     %0= arith.constant dense<[[1, 2, 3], [4, 0, 6], [7, 0, 9]]>:tensor<3x3xi32>
     %1 = call @test(%0) : (tensor<3x3xi32>) -> tensor<3x3xi1>
-    %unranked = tensor.cast %1 : tensor<3x3xi1>to tensor<*xi1>
-    call @printMemrefI32(%unranked) : (tensor<*xi1>) -> ()
+    %2 = call @castI1toI32(%1): (tensor<3x3xi1>) -> tensor<3x3xi32>
+    %unranked = tensor.cast %2 : tensor<3x3xi32>to tensor<*xi32>
+    call @printMemrefI32(%unranked) : (tensor<*xi32>) -> ()
     return
 }
-func.func private @printMemrefI32(tensor<*xi1>)
+
+func.func @castI1toI32(%arg0: tensor<3x3xi1>) -> tensor<3x3xi32> {  // element-wise zero-extension of a 3x3 i1 tensor to i32
+  %init = tensor.empty() : tensor<3x3xi32>
+  %widened = linalg.generic {
+      indexing_maps = [#map, #map], iterator_types = ["parallel", "parallel"]}
+      ins(%arg0 : tensor<3x3xi1>) outs(%init : tensor<3x3xi32>)
+      attrs = {iterator_ranges = [3, 3]} {
+  ^bb0(%flag: i1, %dst: i32):
+    %ext = arith.extui %flag : i1 to i32  // zero-extension: false -> 0, true -> 1
+    linalg.yield %ext : i32
+  } -> tensor<3x3xi32>
+  return %widened : tensor<3x3xi32>
+}
+
+func.func private @printMemrefI32(tensor<*xi32>)
 func.func @test(%arg0: tensor<3x3xi32>)->tensor<3x3xi1>{
     %0 = tensor.empty() : tensor<3x3xi1>
     %1 = linalg.generic {indexing_maps = [#map, #map], iterator_types = ["parallel", "parallel"]} ins(%arg0 : tensor<3x3xi32>) outs(%0 : tensor<3x3xi1>) {
diff --git a/test/PlaidML/OpTest.LogicalOr_float.mlir b/test/PlaidML/OpTest.LogicalOr_float.mlir
@@ -12,11 +12,26 @@ func.func @main() {
     %0= arith.constant dense<[[1.0, 2.0, 3.0], [4.0, 0.0, 6.0], [7.0, 0.0, 9.0]]>:tensor<3x3xf32>
     %1= arith.constant dense<[[10.0, 11.0, 12.0], [0.0, 0.0, 0.0], [16.0, 17.0, 18.0]]>:tensor<3x3xf32>
     %2 = call @test(%0,%1) : (tensor<3x3xf32>,tensor<3x3xf32>) -> tensor<3x3xi1>
-    %unranked = tensor.cast %2 : tensor<3x3xi1>to tensor<*xi1>
-    call @printMemrefI32(%unranked) : (tensor<*xi1>) -> ()
+    %3 = call @castI1toI32(%2): (tensor<3x3xi1>) -> tensor<3x3xi32>
+    %unranked = tensor.cast %3 : tensor<3x3xi32>to tensor<*xi32>
+    call @printMemrefI32(%unranked) : (tensor<*xi32>) -> ()
     return
 }
-func.func private @printMemrefI32(tensor<*xi1>)
+
+func.func @castI1toI32(%arg0: tensor<3x3xi1>) -> tensor<3x3xi32> {  // element-wise zero-extension of a 3x3 i1 tensor to i32
+  %init = tensor.empty() : tensor<3x3xi32>
+  %widened = linalg.generic {
+      indexing_maps = [#map, #map], iterator_types = ["parallel", "parallel"]}
+      ins(%arg0 : tensor<3x3xi1>) outs(%init : tensor<3x3xi32>)
+      attrs = {iterator_ranges = [3, 3]} {
+  ^bb0(%flag: i1, %dst: i32):
+    %ext = arith.extui %flag : i1 to i32  // zero-extension: false -> 0, true -> 1
+    linalg.yield %ext : i32
+  } -> tensor<3x3xi32>
+  return %widened : tensor<3x3xi32>
+}
+
+func.func private @printMemrefI32(tensor<*xi32>)
 func.func @test(%arg0: tensor<3x3xf32>, %arg1: tensor<3x3xf32>)->tensor<3x3xi1>{
     %0 = tensor.empty() : tensor<3x3xi1>
     %1 = linalg.generic {indexing_maps = [#map, #map, #map], iterator_types = ["parallel", "parallel"]} ins(%arg0, %arg1 : tensor<3x3xf32>, tensor<3x3xf32>) outs(%0 : tensor<3x3xi1>) {
diff --git a/test/PlaidML/OpTest.LogicalOr_int32.mlir b/test/PlaidML/OpTest.LogicalOr_int32.mlir
diff --git a/test/PlaidML/OpTest.LogicalOr_uint64.mlir b/test/PlaidML/OpTest.LogicalOr_uint64.mlir
diff --git a/test/PlaidML/lit.local.cfg b/test/PlaidML/lit.local.cfg