Merge pull request #225 from NVIDIA/pytorch_update

narendasan · web-flow · commit 960d338f8f87 · 2020-12-14T14:24:04.000-07:00
Pytorch 1.7 update API changes
diff --git a/.bazelversion b/.bazelversion
@@ -1 +1 @@
-3.4.1
+3.7.0
diff --git a/README.md b/README.md
@@ -71,12 +71,13 @@ torch.jit.save(trt_ts_module, "trt_torchscript_module.ts")
 > Note: Refer NVIDIA NGC container(https://ngc.nvidia.com/catalog/containers/nvidia:l4t-pytorch) for PyTorch libraries on JetPack.
 
 ### Dependencies
+The following dependency versions were used to verify the test cases. TRTorch can work with other versions, but the tests are not guaranteed to pass.
 
-- Bazel 3.3.1
-- Libtorch 1.5.1
-- CUDA 10.2
-- cuDNN 7.6.5 (by default, cuDNN 8 supported with compatable PyTorch build)
-- TensorRT 7.0.0 (by default, TensorRT 7.1 supported with compatable PyTorch build)
+- Bazel 3.7.0
+- Libtorch 1.7.1 (built with CUDA 11.0)
+- CUDA 11.0
+- cuDNN 8
+- TensorRT 7.2.1.6
 
 ## Prebuilt Binaries and Wheel files
 
diff --git a/WORKSPACE b/WORKSPACE
@@ -35,7 +35,7 @@ git_repository(
 # CUDA should be installed on the system locally
 new_local_repository(
     name = "cuda",
-    path = "/usr/local/cuda-10.2/",
+    path = "/usr/local/cuda-11.0/",
     build_file = "@//third_party/cuda:BUILD",
 )
 
@@ -53,16 +53,16 @@ http_archive(
     name = "libtorch",
     build_file = "@//third_party/libtorch:BUILD",
     strip_prefix = "libtorch",
-    urls = ["https://download.pytorch.org/libtorch/cu102/libtorch-cxx11-abi-shared-with-deps-1.6.0.zip"],
-    sha256 = "fded948bd2dbee625cee33ebbd4843a69496729389e0200a90fbb667cdaeeb69"
+    sha256 = "117f6dd65b7267839197397edd0b10fd2900b0f291e3e54b0b800caefc31bcb6",
+    urls = ["https://download.pytorch.org/libtorch/cu110/libtorch-cxx11-abi-shared-with-deps-1.7.1%2Bcu110.zip"],
 )
 
 http_archive(
     name = "libtorch_pre_cxx11_abi",
     build_file = "@//third_party/libtorch:BUILD",
     strip_prefix = "libtorch",
-    sha256 = "141bb229f4bbf905541096cf8705785e7b0c79e37ca1e5db9d372730b1b9abd7",
-    urls = ["https://download.pytorch.org/libtorch/cu102/libtorch-shared-with-deps-1.6.0.zip"],
+    sha256 = "c77f926afd55d7e860ec9c7abc992c25be77c89771c3ec6fcc13ea42f07d46df",
+    urls = ["https://download.pytorch.org/libtorch/cu110/libtorch-shared-with-deps-1.7.1%2Bcu110.zip"],
 )
 
 # Download these tarballs manually from the NVIDIA website
@@ -71,18 +71,18 @@ http_archive(
 
 http_archive(
     name = "cudnn",
-    urls = ["https://developer.nvidia.com/compute/machine-learning/cudnn/secure/7.6.5.32/Production/10.2_20191118/cudnn-10.2-linux-x64-v7.6.5.32.tgz",],
+    urls = ["https://developer.nvidia.com/compute/machine-learning/cudnn/secure/8.0.5/11.0_20201106/cudnn-11.0-linux-x64-v8.0.5.39.tgz",],
     build_file = "@//third_party/cudnn/archive:BUILD",
-    sha256 = "600267f2caaed2fd58eb214ba669d8ea35f396a7d19b94822e6b36f9f7088c20",
+    sha256 = "4e16ee7895deb4a8b1c194b812ba49586ef7d26902051401d3717511898a9b73",
     strip_prefix = "cuda"
 )
 
 http_archive(
     name = "tensorrt",
-    urls = ["https://developer.nvidia.com/compute/machine-learning/tensorrt/secure/7.0/7.0.0.11/tars/TensorRT-7.0.0.11.Ubuntu-18.04.x86_64-gnu.cuda-10.2.cudnn7.6.tar.gz",],
+    urls = ["https://developer.nvidia.com/compute/machine-learning/tensorrt/secure/7.2.1/tars/TensorRT-7.2.1.6.Ubuntu-18.04.x86_64-gnu.cuda-11.0.cudnn8.0.tar.gz",],
     build_file = "@//third_party/tensorrt/archive:BUILD",
-    sha256 = "c7d73b2585b18aae68b740249efa8c8ba5ae852abe9a023720595432a8eb4efd",
-    strip_prefix = "TensorRT-7.0.0.11"
+    sha256 = "8def6b03b0c8c3751f560df21b3e99668ae05aab5140b1d38b8e51e4a0ffbbb8",
+    strip_prefix = "TensorRT-7.2.1.6"
 )
 
 ####################################################################################
@@ -146,5 +146,3 @@ pip3_import(
 
 load("@pylinter_deps//:requirements.bzl", "pip_install")
 pip_install()
-
-
diff --git a/core/conversion/InterfaceTypes.cpp b/core/conversion/InterfaceTypes.cpp
@@ -11,7 +11,7 @@ GraphParams get_named_params(c10::ArrayRef<torch::jit::Value*> inputs, std::vect
   GraphParams named_params;
   auto param_it = params.begin();
   for (auto in : inputs) {
-    if (in->type() != c10::TensorType::get() && in->isCompleteTensor() && param_it != params.end()) {
+    if (in->type() != c10::TensorType::get() && param_it != params.end()) {
       named_params[in] = *param_it;
       ++param_it;
     }
diff --git a/core/conversion/converters/impl/conv_deconv.cpp b/core/conversion/converters/impl/conv_deconv.cpp
@@ -9,82 +9,99 @@ namespace conversion {
 namespace converters {
 namespace impl {
 namespace {
-auto conv_registrations TRTORCH_UNUSED = RegisterNodeConversionPatterns().pattern({
-    R"SIG(aten::_convolution(Tensor input, Tensor weight,
-                                 Tensor? bias, int[] stride, int[] padding,
-                                 int[] dilation, bool transposed,
-                                 int[] output_padding, int groups, bool benchmark,
-                                 bool deterministic, bool cudnn_enabled) -> (Tensor))SIG",
-    [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
-      auto in = args[0].ITensor(); // assumes non-static input Tensor
-      auto w = Weights(ctx, args[1].unwrapToTensor());
-      auto stride = util::toDims(args[3].unwrapToIntList());
-      LOG_DEBUG("stride: " << stride);
-      auto padding = util::toDims(args[4].unwrapToIntList());
-      LOG_DEBUG("padding: " << padding);
-      auto dilation = util::toDims(args[5].unwrapToIntList());
-      LOG_DEBUG("dilation: " << dilation);
-      bool transposed = args[6].unwrapToBool();
-      auto out_padding = util::toDims(args[7].unwrapToIntList());
-      LOG_DEBUG("out_padding: " << out_padding);
-      int64_t groups = args[8].unwrapToInt();
-      LOG_DEBUG("groups: " << groups);
 
-      nvinfer1::ILayer* new_layer;
-      if (transposed) {
-        Weights bias;
-        if (args[2].IValue()->isTensor()) {
-          bias = Weights(ctx, args[2].unwrapToTensor());
-        } else {
-          bias = Weights(ctx, torch::zeros(args[1].unwrapToTensor().sizes()[1] * groups));
-        }
+bool add_conv_deconv(ConversionCtx* ctx, const torch::jit::Node* n, args& args) {
+  auto in = args[0].ITensor(); // assumes non-static input Tensor
+  auto w = Weights(ctx, args[1].unwrapToTensor());
+  auto stride = util::toDims(args[3].unwrapToIntList());
+  LOG_DEBUG("stride: " << stride);
+  auto padding = util::toDims(args[4].unwrapToIntList());
+  LOG_DEBUG("padding: " << padding);
+  auto dilation = util::toDims(args[5].unwrapToIntList());
+  LOG_DEBUG("dilation: " << dilation);
+  bool transposed = args[6].unwrapToBool();
+  auto out_padding = util::toDims(args[7].unwrapToIntList());
+  LOG_DEBUG("out_padding: " << out_padding);
+  int64_t groups = args[8].unwrapToInt();
+  LOG_DEBUG("groups: " << groups);
+
+  nvinfer1::ILayer* new_layer;
+  if (transposed) {
+    Weights bias;
+    if (args[2].IValue()->isTensor()) {
+      bias = Weights(ctx, args[2].unwrapToTensor());
+    } else {
+      bias = Weights(ctx, torch::zeros(args[1].unwrapToTensor().sizes()[1] * groups));
+    }
 
-        // shape of deconvolution's weight: [in, out/groups, ...]
-        auto deconv = ctx->net->addDeconvolutionNd(
-            *in, args[1].unwrapToTensor().sizes()[1] * groups, w.kernel_shape, w.data, bias.data);
-        TRTORCH_CHECK(deconv, "Unable to create deconvolution layer from node: " << *n);
+    // shape of deconvolution's weight: [in, out/groups, ...]
+    auto deconv = ctx->net->addDeconvolutionNd(
+        *in, args[1].unwrapToTensor().sizes()[1] * groups, w.kernel_shape, w.data, bias.data);
+    TRTORCH_CHECK(deconv, "Unable to create deconvolution layer from node: " << *n);
 
-        deconv->setStrideNd(stride);
-        deconv->setPaddingNd(padding);
-#if NV_TENSORRT_MAJOR > 7 || (NV_TENSORRT_MAJOR == 7 && NV_TENSORRT_MINOR == 1)
-        deconv->setDilationNd(dilation);
-        deconv->setNbGroups(groups);
+    deconv->setStrideNd(stride);
+    deconv->setPaddingNd(padding);
+#if NV_TENSORRT_MAJOR > 7 || (NV_TENSORRT_MAJOR == 7 && NV_TENSORRT_MINOR >= 1)
+    deconv->setDilationNd(dilation);
+    deconv->setNbGroups(groups);
 #else
-        TRTORCH_CHECK(groups == 1, "for deconv with groups > 1, require TensorRT version >= 7.1");
-        for (auto it = dilation.begin(); it != dilation.end(); ++it) {
-          TRTORCH_CHECK(*it == 1, "for deconv with dilation > 1, require TensorRT version >= 7.1");
-        }
+    TRTORCH_CHECK(groups == 1, "for deconv with groups > 1, require TensorRT version >= 7.1");
+    for (int idx = 0; idx < dilation.nbDims; idx++) {
+      TRTORCH_CHECK(dilation.d[idx] == 1, "for deconv with dilation > 1, require TensorRT version >= 7.1");
+    }
 #endif
-        new_layer = deconv;
-      } else {
-        Weights bias;
-        if (args[2].IValue()->isTensor()) {
-          bias = Weights(ctx, args[2].unwrapToTensor());
-        } else {
-          bias = Weights(ctx, torch::zeros(args[1].unwrapToTensor().sizes()[0]));
-        }
+    new_layer = deconv;
+  } else {
+    Weights bias;
+    if (args[2].IValue()->isTensor()) {
+      bias = Weights(ctx, args[2].unwrapToTensor());
+    } else {
+      bias = Weights(ctx, torch::zeros(args[1].unwrapToTensor().sizes()[0]));
+    }
 
-        // shape of convolution's weight: [out, in/groups, ...]
-        auto conv =
-            ctx->net->addConvolutionNd(*in, args[1].unwrapToTensor().sizes()[0], w.kernel_shape, w.data, bias.data);
-        TRTORCH_CHECK(conv, "Unable to create convolution layer from node: " << *n);
+    // shape of convolution's weight: [out, in/groups, ...]
+    auto conv = ctx->net->addConvolutionNd(*in, args[1].unwrapToTensor().sizes()[0], w.kernel_shape, w.data, bias.data);
+    TRTORCH_CHECK(conv, "Unable to create convolution layer from node: " << *n);
 
-        conv->setStrideNd(stride);
-        conv->setPaddingMode(nvinfer1::PaddingMode::kCAFFE_ROUND_DOWN);
-        conv->setPaddingNd(padding);
-        conv->setPostPadding(out_padding);
-        conv->setDilationNd(dilation);
-        conv->setNbGroups(groups);
-        new_layer = conv;
-      }
-      new_layer->setName(util::node_info(n).c_str());
+    conv->setStrideNd(stride);
+    conv->setPaddingMode(nvinfer1::PaddingMode::kCAFFE_ROUND_DOWN);
+    conv->setPaddingNd(padding);
+    conv->setPostPadding(out_padding);
+    conv->setDilationNd(dilation);
+    conv->setNbGroups(groups);
+    new_layer = conv;
+  }
+  new_layer->setName(util::node_info(n).c_str());
 
-      auto out = ctx->AssociateValueAndTensor(n->outputs()[0], new_layer->getOutput(0));
+  auto out = ctx->AssociateValueAndTensor(n->outputs()[0], new_layer->getOutput(0));
 
-      LOG_DEBUG("Output tensor shape: " << out->getDimensions());
+  LOG_DEBUG("Output tensor shape: " << out->getDimensions());
 
-      return true;
-    }});
+  return true;
+}
+
+auto conv_registrations TRTORCH_UNUSED = RegisterNodeConversionPatterns()
+                                             .pattern({
+                                                 R"SIG(aten::_convolution(Tensor input, Tensor weight,
+                                 Tensor? bias, int[] stride, int[] padding,
+                                 int[] dilation, bool transposed,
+                                 int[] output_padding, int groups, bool benchmark,
+                                 bool deterministic, bool cudnn_enabled, bool allow_tf32) -> (Tensor))SIG",
+                                                 [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
+                                                   return add_conv_deconv(ctx, n, args);
+                                                 }})
+                                             .pattern({
+                                                 R"SIG(aten::_convolution.deprecated(Tensor input, Tensor weight,
+                                     Tensor? bias, int[] stride, int[] padding,
+                                     int[] dilation, bool transposed,
+                                     int[] output_padding, int groups, bool benchmark,
+                                     bool deterministic, bool cudnn_enabled) -> (Tensor))SIG",
+                                                 [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
+                                                   // This pattern is only matched for traced JIT models which do not
+                                                   // have the allow_tf32 bool in the function signature. The TRT
+                                                   // conversion code is exactly the same as for the pattern above.
+                                                   return add_conv_deconv(ctx, n, args);
+                                                 }});
 } // namespace
 } // namespace impl
 } // namespace converters
diff --git a/core/conversion/converters/impl/interpolate.cpp b/core/conversion/converters/impl/interpolate.cpp
@@ -77,7 +77,7 @@ void resize_layer_size(
 auto interpolate_registrations TRTORCH_UNUSED =
     RegisterNodeConversionPatterns()
         .pattern(
-            {"aten::upsample_nearest1d(Tensor self, int[1] output_size, float? scales=None) -> (Tensor)",
+            {"aten::upsample_nearest1d.vec(Tensor self, int[] output_size, float? scales=None) -> (Tensor)",
              [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
                auto in = args[0].ITensor();
                auto in_shape = util::toVec(in->getDimensions());
@@ -154,7 +154,7 @@ auto interpolate_registrations TRTORCH_UNUSED =
                return true;
              }})
         .pattern(
-            {"aten::upsample_linear1d(Tensor self, int[1] output_size, bool align_corners, float? scales=None) -> (Tensor)",
+            {"aten::upsample_linear1d.vec(Tensor self, int[] output_size, bool align_corners, float[]? scales) -> (Tensor)",
              [](ConversionCtx* ctx, const torch::jit::Node* n, args& args) -> bool {
                auto in = args[0].ITensor();
                auto in_shape = util::toVec(in->getDimensions());
diff --git a/core/lowering/lowering.cpp b/core/lowering/lowering.cpp
@@ -8,6 +8,7 @@
 #include "torch/csrc/jit/passes/lower_graph.h"
 #include "torch/csrc/jit/passes/lower_tuples.h"
 #include "torch/csrc/jit/passes/peephole.h"
+#include "torch/csrc/jit/passes/remove_mutation.h"
 
 #include "core/lowering/lowering.h"
 #include "core/lowering/passes/passes.h"
diff --git a/core/lowering/passes/conv2d_to_convolution.cpp b/core/lowering/passes/conv2d_to_convolution.cpp
@@ -16,7 +16,7 @@ void Conv2DToConvolution(std::shared_ptr<torch::jit::Graph>& graph) {
         graph(%x, %w, %b, %s, %p, %d, %g):
             %1 : bool = prim::Constant[value=0]()
             %2 : int[] = prim::Constant[value=[0, 0]]()
-            %4 : Tensor = aten::_convolution(%x, %w, %b, %s, %p, %d, %1, %2, %g, %1, %1, %1)
+            %4 : Tensor = aten::_convolution(%x, %w, %b, %s, %p, %d, %1, %2, %g, %1, %1, %1, %1)
             return (%4))IR";
   ;
 
diff --git a/core/lowering/passes/conv3d_to_convolution.cpp b/core/lowering/passes/conv3d_to_convolution.cpp
@@ -16,7 +16,7 @@ void Conv3DToConvolution(std::shared_ptr<torch::jit::Graph>& graph) {
         graph(%x, %w, %b, %s, %p, %d, %g):
             %1 : bool = prim::Constant[value=0]()
             %2 : int[] = prim::Constant[value=[0, 0, 0]]()
-            %4 : Tensor = aten::_convolution(%x, %w, %b, %s, %p, %d, %1, %2, %g, %1, %1, %1)
+            %4 : Tensor = aten::_convolution(%x, %w, %b, %s, %p, %d, %1, %2, %g, %1, %1, %1, %1)
             return (%4))IR";
   ;
 
diff --git a/core/lowering/register_trt_placeholder_ops.cpp b/core/lowering/register_trt_placeholder_ops.cpp
@@ -10,12 +10,7 @@ c10::AliasAnalysisKind aliasAnalysisFromSchema() {
 RegisterOperators trt_placeholder_ops_reg({
     /// Op marks a Tensor to be conveted from an Torch Tensor
     /// to a TRT constant Tensor
-    Operator(
-        "trt::const(Tensor val) -> Tensor",
-        [](Stack& stack) {
-          return 0; // noop
-        },
-        aliasAnalysisFromSchema()),
+    Operator("trt::const(Tensor val) -> Tensor", [](Stack* stack) {}, aliasAnalysisFromSchema()),
 });
 
 } // namespace jit
diff --git a/cpp/api/include/trtorch/macros.h b/cpp/api/include/trtorch/macros.h
@@ -20,7 +20,7 @@
 #define STR(x) XSTR(x)
 
 #define TRTORCH_MAJOR_VERSION 0
-#define TRTORCH_MINOR_VERSION 1
+#define TRTORCH_MINOR_VERSION 2
 #define TRTORCH_PATCH_VERSION 0
 #define TRTORCH_VERSION      \
   STR(TRTORCH_MAJOR_VERSION) \
diff --git a/py/requirements.txt b/py/requirements.txt
@@ -1 +1 @@
-torch==1.6.0
+torch==1.7.0
diff --git a/py/setup.py b/py/setup.py
@@ -16,7 +16,7 @@
 
 dir_path = os.path.dirname(os.path.realpath(__file__))
 
-__version__ = '0.1.0'
+__version__ = '0.2.0a0'
 
 CXX11_ABI = False
 
@@ -204,7 +204,7 @@ def run(self):
       long_description=long_description,
       ext_modules=ext_modules,
       install_requires=[
-          'torch==1.6.0',
+          'torch==1.7.1',
       ],
       setup_requires=[],
       cmdclass={
diff --git a/tests/core/converters/test_conv_deconv.cpp b/tests/core/converters/test_conv_deconv.cpp
diff --git a/tests/modules/hub.py b/tests/modules/hub.py
diff --git a/tests/py/requirements.txt b/tests/py/requirements.txt

Original file line number	Diff line number	Diff line change
`@@ -11,7 +11,7 @@ GraphParams get_named_params(c10::ArrayRef<torch::jit::Value*> inputs, std::vect`
`11`	`11`	`GraphParams named_params;`
`12`	`12`	`auto param_it = params.begin();`
`13`	`13`	`for (auto in : inputs) {`
`14`		`- if (in->type() != c10::TensorType::get() && in->isCompleteTensor() && param_it != params.end()) {`
	`14`	`+ if (in->type() != c10::TensorType::get() && param_it != params.end()) {`
`15`	`15`	`named_params[in] = *param_it;`
`16`	`16`	`++param_it;`
`17`	`17`	`}`
Original file line number	Diff line number	Diff line change
`@@ -16,7 +16,7 @@ void Conv2DToConvolution(std::shared_ptr<torch::jit::Graph>& graph) {`
`16`	`16`	`graph(%x, %w, %b, %s, %p, %d, %g):`
`17`	`17`	`%1 : bool = prim::Constant[value=0]()`
`18`	`18`	`%2 : int[] = prim::Constant[value=[0, 0]]()`
`19`		`- %4 : Tensor = aten::_convolution(%x, %w, %b, %s, %p, %d, %1, %2, %g, %1, %1, %1)`
	`19`	`+ %4 : Tensor = aten::_convolution(%x, %w, %b, %s, %p, %d, %1, %2, %g, %1, %1, %1, %1)`
`20`	`20`	`return (%4))IR";`
`21`	`21`	`;`
`22`	`22`
Original file line number	Diff line number	Diff line change
`@@ -16,7 +16,7 @@ void Conv3DToConvolution(std::shared_ptr<torch::jit::Graph>& graph) {`
`16`	`16`	`graph(%x, %w, %b, %s, %p, %d, %g):`
`17`	`17`	`%1 : bool = prim::Constant[value=0]()`
`18`	`18`	`%2 : int[] = prim::Constant[value=[0, 0, 0]]()`
`19`		`- %4 : Tensor = aten::_convolution(%x, %w, %b, %s, %p, %d, %1, %2, %g, %1, %1, %1)`
	`19`	`+ %4 : Tensor = aten::_convolution(%x, %w, %b, %s, %p, %d, %1, %2, %g, %1, %1, %1, %1)`
`20`	`20`	`return (%4))IR";`
`21`	`21`	`;`
`22`	`22`