@@ -15,6 +15,18 @@ namespace converters {
15
15
namespace impl {
16
16
namespace {
17
17
18
+ nvinfer1::ITensor* concat (int max_rank, int old_rank, ConversionCtx* ctx, nvinfer1::ITensor* tensor) {
19
+ if (max_rank - old_rank > 0 ) {
20
+ torch::Tensor thOne = torch::tensor (std::vector<int32_t >(max_rank - old_rank, 1 ), torch::kInt32 );
21
+ auto one_tensor = tensor_to_const (ctx, thOne);
22
+ auto in_shape_tensor = ctx->net ->addShape (*tensor)->getOutput (0 );
23
+ nvinfer1::ITensor* const args[2 ] = {one_tensor, in_shape_tensor};
24
+ return ctx->net ->addConcatenation (args, 2 )->getOutput (0 );
25
+ } else { // max_rank - old_rank == 0
26
+ return ctx->net ->addShape (*tensor)->getOutput (0 );
27
+ }
28
+ }
29
+
18
30
bool add_expand (ConversionCtx* ctx, const torch::jit::Node* n, nvinfer1::ITensor* in, nvinfer1::Dims expandedDims) {
19
31
auto input_dims = in->getDimensions ();
20
32
TRTORCH_CHECK (
@@ -27,12 +39,26 @@ bool add_expand(ConversionCtx* ctx, const torch::jit::Node* n, nvinfer1::ITensor
27
39
int64_t dim = input_dims.nbDims - 1 - offset;
28
40
int64_t size = (dim >= 0 ) ? input_dims.d [dim] : 1 ;
29
41
int64_t targetSize = expandedDims.d [i];
30
- if (size != targetSize) {
31
- if (size != 1 ) {
42
+ // In expand layer passing -1 as the size for a dimension means not changing the size of that dimension.
43
+ if (targetSize != -1 ) {
44
+ if (size != targetSize) {
45
+ if (size != 1 ) {
46
+ TRTORCH_THROW_ERROR (
47
+ " The expanded size of tensor (" << targetSize << " )"
48
+ << " must match the existing size (" << size << " )"
49
+ << " at dimension " << i);
50
+ }
51
+ }
52
+ } else {
53
+ // For the new dimensions, the size cannot be set to -1. Eg: an input of [3, 1] can be expanded to [3, -1, 4] but
54
+ // not [-1, 3, 4].
55
+ if (dim < 0 ) {
32
56
TRTORCH_THROW_ERROR (
33
- " The expanded size of tensor (" << targetSize << " )"
34
- << " must match the existing size (" << size << " )"
35
- << " at dimension " << i);
57
+ " The expanded size of the tensor (" << targetSize << " ) isn't allowed in a leading, non-existing dimension "
58
+ << i);
59
+ } else {
60
+ // in(3, 1), expand(3, -1, 4) -> expand(3, 3, 4)
61
+ expandedDims.d [i] = input_dims.d [dim];
36
62
}
37
63
}
38
64
}
@@ -76,77 +102,192 @@ bool add_expand(ConversionCtx* ctx, const torch::jit::Node* n, nvinfer1::ITensor
76
102
return true ;
77
103
}
78
104
105
+ bool add_expand_dynamic (
106
+ ConversionCtx* ctx,
107
+ const torch::jit::Node* n,
108
+ nvinfer1::ITensor* in,
109
+ nvinfer1::ITensor* expandedDimsTensor,
110
+ nvinfer1::Dims expandedDims,
111
+ bool is_expand_layer) {
112
+ auto input_dims = in->getDimensions ();
113
+ auto input_rank = in->getDimensions ().nbDims ;
114
+ auto output_rank = expandedDims.nbDims ;
115
+ TRTORCH_CHECK (
116
+ input_rank <= output_rank,
117
+ " Number of dimensions of the desired expansion must be greater than or equal to the number of input dimensions" );
118
+
119
+ /* TODO: When the inputs are dynamic, some dimensions of the inputs are indeterminate before setBindingDimensions. For
120
+ these indeterminate dimensions, we don't validate the expansion. Eg: For an input of [3, -1], we omit the
121
+ validation of the second dimension. Need to explore a better way to validate the expansion.
122
+ */
123
+ // Validate the expansion. Eg: an input of [3, 1] can be expanded to [1, 3, 4] but not [3, 4, 1]
124
+ for (int64_t i = expandedDims.nbDims - 1 ; i >= 0 ; --i) {
125
+ int64_t offset = expandedDims.nbDims - 1 - i;
126
+ int64_t dim = input_dims.nbDims - 1 - offset;
127
+ int64_t size = (dim >= 0 ) ? input_dims.d [dim] : 1 ;
128
+ int64_t targetSize = expandedDims.d [i];
129
+ // Passing -1 as the size for a dimension means not changing the size of that dimension in expand layer.
130
+ if (targetSize != -1 ) {
131
+ if (size != targetSize) {
132
+ // if size == -1, we can't validate the expansion before setBindingDimensions.
133
+ if (!(size == -1 || size == 1 )) {
134
+ TRTORCH_THROW_ERROR (
135
+ " The expanded size of tensor (" << targetSize << " )"
136
+ << " must match the existing size (" << size << " )"
137
+ << " at dimension " << i);
138
+ }
139
+ }
140
+ } else {
141
+ // In dynamic expand layer, for the new dimensions, the size cannot be set to -1. Eg: an input of [3, 1] can be
142
+ // expanded to [3, -1, 4] but not [-1, 3, 4].
143
+ if (is_expand_layer && dim < 0 ) {
144
+ TRTORCH_THROW_ERROR (
145
+ " The expanded size of the tensor (" << targetSize << " ) isn't allowed in a leading, non-existing dimension "
146
+ << i);
147
+ }
148
+ }
149
+ }
150
+
151
+ size_t max_rank = std::max (input_rank, output_rank);
152
+
153
+ // Dimensions are right alignment. Eg: an input of [3, 1] and max_rank = 4, the result of concat is [1, 1, 3, 1]
154
+ auto new_input_shape_tensor = concat (max_rank, input_rank, ctx, in);
155
+ auto new_output_shape_tensor = expandedDimsTensor;
156
+
157
+ // Add a reshape layer to expand dims
158
+ auto shuffle = ctx->net ->addShuffle (*in);
159
+ shuffle->setInput (1 , *new_input_shape_tensor);
160
+
161
+ // Start the slicing from beginning of tensor since this is an expand layer
162
+ std::vector<int64_t > start_vec (max_rank, 0 );
163
+ nvinfer1::Dims starts_dim = util::toDims (c10::IntArrayRef (start_vec));
164
+ at::Tensor thStart = torch::tensor (util::toVec (starts_dim), torch::kInt32 );
165
+ auto starts = tensor_to_const (ctx, thStart);
166
+
167
+ // compute sizes = max(x,y).
168
+ auto sizes =
169
+ ctx->net ->addElementWise (*new_input_shape_tensor, *new_output_shape_tensor, nvinfer1::ElementWiseOperation::kMAX )
170
+ ->getOutput (0 );
171
+ nvinfer1::Dims sizes_dim{-1 , {}};
172
+ sizes_dim.nbDims = max_rank;
173
+
174
+ // Compute (x > 1 ? 1 : 0) for x in newDims, assuming positive x, using only TensorRT operations.
175
+ // min(1, sub(input_shape, 1))
176
+ torch::Tensor thOne = torch::tensor ({1 }, torch::kInt32 );
177
+ auto one_tensor = tensor_to_const (ctx, thOne);
178
+ auto x_sub_one = ctx->net ->addElementWise (*new_input_shape_tensor, *one_tensor, nvinfer1::ElementWiseOperation::kSUB )
179
+ ->getOutput (0 );
180
+ auto strides = ctx->net ->addElementWise (*one_tensor, *x_sub_one, nvinfer1::ElementWiseOperation::kMIN )->getOutput (0 );
181
+ nvinfer1::Dims strides_dim{-1 , {}};
182
+ strides_dim.nbDims = max_rank;
183
+
184
+ // Slice layer does the expansion in TRT. Desired output size is specified by sizes input at index 2.
185
+ auto slice = ctx->net ->addSlice (*shuffle->getOutput (0 ), starts_dim, sizes_dim, strides_dim);
186
+ slice->setInput (1 , *starts);
187
+ slice->setInput (2 , *sizes);
188
+ slice->setInput (3 , *strides);
189
+
190
+ auto out_tensor = ctx->AssociateValueAndTensor (n->outputs ()[0 ], slice->getOutput (0 ));
191
+
192
+ LOG_DEBUG (" Expand layer output tensor shape: " << out_tensor->getDimensions ());
193
+
194
+ return true ;
195
+ }
196
+
79
197
// Converter registrations for aten::expand, aten::expand_as and aten::repeat.
// Each converter dispatches to the dynamic-shape path (add_expand_dynamic /
// shape-tensor reshape) when the network has dynamic inputs, and to the
// static-shape path otherwise.
auto expand_registrations TRTORCH_UNUSED =
    RegisterNodeConversionPatterns()
        .pattern(
            {"aten::expand(Tensor(a) self, int[] size, *, bool implicit=False) -> (Tensor(a))",
             [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
               auto in = args[0].ITensor();
               auto input_dims = in->getDimensions();
               auto expanded_size = args[1].unwrapToIntList();
               auto expandedDims = util::toDims(expanded_size);
               LOG_DEBUG("(expand layer) Expand input from " << input_dims << " to " << expandedDims);
               if (ctx->input_is_dynamic) {
                 // Dynamic path: feed the requested sizes in as a constant shape tensor.
                 at::Tensor thExpanded_size = torch::tensor(expanded_size.vec(), torch::kInt32);
                 auto expandedDimsTensor = tensor_to_const(ctx, thExpanded_size);
                 return add_expand_dynamic(ctx, n, in, expandedDimsTensor, expandedDims, true);
               } else {
                 return add_expand(ctx, n, in, expandedDims);
               }
             }})
        .pattern(
            {"aten::expand_as(Tensor(a) self, Tensor other) -> (Tensor(a))",
             [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
               auto in = args[0].ITensor();
               auto input_dims = in->getDimensions();
               auto targetTensor = args[1].ITensor();
               auto targetDims = targetTensor->getDimensions();
               LOG_DEBUG("(expand_as layer) Expand input from " << input_dims << " to " << targetDims);
               if (ctx->input_is_dynamic) {
                 // Dynamic path: read the target shape off the reference tensor at runtime.
                 return add_expand_dynamic(
                     ctx, n, in, ctx->net->addShape(*targetTensor)->getOutput(0), targetDims, false);
               } else {
                 return add_expand(ctx, n, in, targetDims);
               }
             }})
        .pattern(
            {"aten::repeat(Tensor self, int[] repeats) -> (Tensor)",
             [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
               auto in = args[0].ITensor();
               auto input_dims = in->getDimensions();
               auto repeats = args[1].unwrapToIntList().vec();
               int repeats_rank = repeats.size();
               TRTORCH_CHECK(
                   repeats_rank >= input_dims.nbDims,
                   "Number of repeat dimensions cannot be smaller than number of input dimensions");
               auto num_expand_dims = repeats_rank - input_dims.nbDims;

               if (ctx->input_is_dynamic) {
                 // Left-pad the runtime shape with 1s up to repeats_rank, then
                 // reshape the input to that padded shape.
                 int input_rank = input_dims.nbDims;
                 int output_rank = repeats_rank;
                 auto new_input_shape_tensor = concat(output_rank, input_rank, ctx, in);

                 // Add a reshape layer to expand dims
                 auto shuffle = ctx->net->addShuffle(*in);
                 shuffle->setInput(1, *new_input_shape_tensor);
                 in = shuffle->getOutput(0);
               } else {
                 if (num_expand_dims > 0) {
                   // Static path: build the padded dims directly.
                   nvinfer1::Dims reshape_dims;
                   reshape_dims.nbDims = repeats.size();
                   for (int i = 0; i < num_expand_dims; i++) {
                     reshape_dims.d[i] = 1;
                   }
                   for (int i = 0; i < input_dims.nbDims; i++) {
                     reshape_dims.d[num_expand_dims + i] = input_dims.d[i];
                   }
                   // Add a reshape layer to expand dims
                   auto reshape_layer = ctx->net->addShuffle(*in);
                   reshape_layer->setReshapeDimensions(reshape_dims);
                   in = reshape_layer->getOutput(0);
                   LOG_DEBUG("Input reshaped to : " << in->getDimensions() << " from " << input_dims);
                 }
                 LOG_DEBUG("Repeats: " << repeats);
               }

               // Concat across all repeat axes.
               // TODO: Implementation might not be performant. Explore other strategies to improve performance.
               for (int i = repeats.size() - 1; i >= 0; --i) {
                 std::vector<nvinfer1::ITensor*> tensors_vec;
                 for (int j = 0; j < repeats[i]; j++) {
                   tensors_vec.push_back(in);
                 }
                 auto concat_layer = ctx->net->addConcatenation(tensors_vec.data(), tensors_vec.size());
                 concat_layer->setAxis(i);
                 in = concat_layer->getOutput(0);
               }

               auto out = ctx->AssociateValueAndTensor(n->outputs()[0], in);

               LOG_DEBUG("Repeat layer output tensor shape: " << out->getDimensions());
               return true;
             }});
146
287
147
288
} // namespace
148
289
} // namespace impl
149
290
} // namespace converters
150
291
} // namespace conversion
151
292
} // namespace core
152
- } // namespace trtorch
293
+ } // namespace trtorch
0 commit comments