Merge pull request #578 from borisfom/trt7_back

narendasan · web-flow · commit b91c2689a3d4 · 2021-08-20T14:03:24.000-06:00
Backwards compatibility for TRT 7.x
diff --git a/core/conversion/conversionctx/ConversionCtx.cpp b/core/conversion/conversionctx/ConversionCtx.cpp
@@ -54,11 +54,12 @@ ConversionCtx::ConversionCtx(BuilderSettings build_settings)
         cudaSetDevice(settings.device.gpu_id) == cudaSuccess, "Unable to set gpu id: " << settings.device.gpu_id);
   }
 
-  builder = nvinfer1::createInferBuilder(logger);
-  net = builder->createNetworkV2(1U << static_cast<uint32_t>(nvinfer1::NetworkDefinitionCreationFlag::kEXPLICIT_BATCH));
+  builder = make_trt(nvinfer1::createInferBuilder(logger));
+  net = make_trt(
+      builder->createNetworkV2(1U << static_cast<uint32_t>(nvinfer1::NetworkDefinitionCreationFlag::kEXPLICIT_BATCH)));
 
   LOG_DEBUG(build_settings);
-  cfg = builder->createBuilderConfig();
+  cfg = make_trt(builder->createBuilderConfig());
 
   for (auto p = settings.enabled_precisions.begin(); p != settings.enabled_precisions.end(); ++p) {
     switch (*p) {
@@ -91,11 +92,11 @@ ConversionCtx::ConversionCtx(BuilderSettings build_settings)
   if (settings.disable_tf32) {
     cfg->clearFlag(nvinfer1::BuilderFlag::kTF32);
   }
-
+#if NV_TENSORRT_MAJOR > 7
   if (settings.sparse_weights) {
     cfg->setFlag(nvinfer1::BuilderFlag::kSPARSE_WEIGHTS);
   }
-
+#endif
   if (settings.refit) {
     cfg->setFlag(nvinfer1::BuilderFlag::kREFIT);
   }
@@ -136,9 +137,6 @@ ConversionCtx::ConversionCtx(BuilderSettings build_settings)
 }
 
 ConversionCtx::~ConversionCtx() {
-  delete builder;
-  delete net;
-  delete cfg;
   for (auto ptr : builder_resources) {
     free(ptr);
   }
@@ -156,10 +154,19 @@ torch::jit::IValue* ConversionCtx::AssociateValueAndIValue(const torch::jit::Val
 }
 
 std::string ConversionCtx::SerializeEngine() {
+#if NV_TENSORRT_MAJOR > 7
   auto serialized_network = builder->buildSerializedNetwork(*net, *cfg);
   if (!serialized_network) {
     TRTORCH_THROW_ERROR("Building serialized network failed in TensorRT");
   }
+#else
+  auto engine = builder->buildEngineWithConfig(*net, *cfg);
+  if (!engine) {
+    TRTORCH_THROW_ERROR("Building TensorRT engine failed");
+  }
+  auto serialized_network = engine->serialize();
+  engine->destroy();
+#endif
   auto engine_str = std::string((const char*)serialized_network->data(), serialized_network->size());
   return engine_str;
 }
diff --git a/core/conversion/conversionctx/ConversionCtx.h b/core/conversion/conversionctx/ConversionCtx.h
@@ -32,7 +32,7 @@ struct BuilderSettings {
   bool strict_types = false;
   bool truncate_long_and_double = false;
   Device device;
-  nvinfer1::EngineCapability capability = nvinfer1::EngineCapability::kSTANDARD;
+  nvinfer1::EngineCapability capability = TRT_ENGINE_CAPABILITY_STANDARD;
   nvinfer1::IInt8Calibrator* calibrator = nullptr;
   uint64_t num_min_timing_iters = 2;
   uint64_t num_avg_timing_iters = 1;
@@ -56,9 +56,9 @@ struct ConversionCtx {
   uint64_t num_inputs = 0;
   uint64_t num_outputs = 0;
   bool input_is_dynamic = false;
-  nvinfer1::IBuilder* builder;
-  nvinfer1::INetworkDefinition* net;
-  nvinfer1::IBuilderConfig* cfg;
+  std::shared_ptr<nvinfer1::IBuilder> builder;
+  std::shared_ptr<nvinfer1::INetworkDefinition> net;
+  std::shared_ptr<nvinfer1::IBuilderConfig> cfg;
   std::set<nvinfer1::DataType> enabled_precisions;
   BuilderSettings settings;
   util::logging::TRTorchLogger logger;
diff --git a/core/conversion/converters/Weights.h b/core/conversion/converters/Weights.h
@@ -25,4 +25,4 @@ struct Weights {
 } // namespace converters
 } // namespace conversion
 } // namespace core
-} // namespace trtorch
+} // namespace trtorch
diff --git a/core/conversion/converters/impl/interpolate.cpp b/core/conversion/converters/impl/interpolate.cpp
@@ -108,10 +108,13 @@ void resize_layer_size(
 
   resize_layer->setResizeMode(mode);
   resize_layer->setName(util::node_info(n).c_str());
-
+#if NV_TENSORRT_MAJOR < 8
+  resize_layer->setAlignCorners(align_corners);
+#else
   if (align_corners) {
     resize_layer->setCoordinateTransformation(nvinfer1::ResizeCoordinateTransformation::kALIGN_CORNERS);
   }
+#endif
   auto layer_output = ctx->AssociateValueAndTensor(n->outputs()[0], resize_layer->getOutput(0));
 
   LOG_DEBUG("Output tensor shape: " << layer_output->getDimensions());
diff --git a/core/conversion/converters/impl/quantization.cpp b/core/conversion/converters/impl/quantization.cpp
@@ -9,6 +9,7 @@ namespace converters {
 namespace impl {
 namespace {
 
+#if NV_TENSORRT_MAJOR > 7
 // clang-format off
 auto quantization_registrations TRTORCH_UNUSED = RegisterNodeConversionPatterns()
   .pattern({"aten::fake_quantize_per_tensor_affine(Tensor self, float scale, int zero_point, int quant_min, int quant_max) -> (Tensor)",
@@ -53,6 +54,7 @@ auto quantization_registrations TRTORCH_UNUSED = RegisterNodeConversionPatterns(
               return true;
             }});
 // clang-format on
+#endif
 } // namespace
 } // namespace impl
 } // namespace converters
diff --git a/core/runtime/TRTEngine.cpp b/core/runtime/TRTEngine.cpp
@@ -43,15 +43,14 @@ TRTEngine::TRTEngine(std::string mod_name, std::string serialized_engine, CudaDe
   device_info = most_compatible_device.value();
   set_cuda_device(device_info);
 
-  rt = std::shared_ptr<nvinfer1::IRuntime>(nvinfer1::createInferRuntime(util::logging::get_logger()));
+  rt = make_trt(nvinfer1::createInferRuntime(util::logging::get_logger()));
 
   name = slugify(mod_name);
 
-  cuda_engine = std::shared_ptr<nvinfer1::ICudaEngine>(
-      rt->deserializeCudaEngine(serialized_engine.c_str(), serialized_engine.size()));
-  TRTORCH_CHECK((cuda_engine != nullptr), "Unable to deserialize the TensorRT engine");
+  cuda_engine = make_trt(rt->deserializeCudaEngine(serialized_engine.c_str(), serialized_engine.size()));
+  TRTORCH_CHECK((cuda_engine.get() != nullptr), "Unable to deserialize the TensorRT engine");
 
-  exec_ctx = std::shared_ptr<nvinfer1::IExecutionContext>(cuda_engine->createExecutionContext());
+  exec_ctx = make_trt(cuda_engine->createExecutionContext());
 
   uint64_t inputs = 0;
   uint64_t outputs = 0;
diff --git a/core/util/trt_util.cpp b/core/util/trt_util.cpp
@@ -201,7 +201,7 @@ std::vector<int64_t> toVec(nvinfer1::Dims d) {
   for (int i = 0; i < d.nbDims; i++) {
     dims.push_back(d.d[i]);
   }
-  return std::move(dims);
+  return dims;
 }
 
 std::string toStr(nvinfer1::Dims d) {
diff --git a/core/util/trt_util.h b/core/util/trt_util.h
@@ -8,6 +8,30 @@
 
 namespace nvinfer1 {
 
+#if NV_TENSORRT_MAJOR < 8
+
+#define TRT_ENGINE_CAPABILITY_STANDARD nvinfer1::EngineCapability::kDEFAULT
+#define TRT_ENGINE_CAPABILITY_SAFETY nvinfer1::EngineCapability::kSAFE_GPU
+#define TRT_ENGINE_CAPABILITY_DLA_STANDALONE nvinfer1::EngineCapability::kSAFE_DLA
+
+template <class T>
+std::shared_ptr<T> make_trt(T* p) {
+  return std::shared_ptr<T>(p, [](T* p) { p->destroy(); });
+}
+
+#else
+
+#define TRT_ENGINE_CAPABILITY_STANDARD nvinfer1::EngineCapability::kSTANDARD
+#define TRT_ENGINE_CAPABILITY_SAFETY nvinfer1::EngineCapability::kSAFETY
+#define TRT_ENGINE_CAPABILITY_DLA_STANDALONE nvinfer1::EngineCapability::kDLA_STANDALONE
+
+template <class T>
+std::shared_ptr<T> make_trt(T* p) {
+  return std::shared_ptr<T>(p);
+}
+
+#endif
+
 inline std::ostream& operator<<(std::ostream& os, const nvinfer1::TensorFormat& format) {
   switch (format) {
     case nvinfer1::TensorFormat::kLINEAR:
@@ -87,11 +111,11 @@ inline std::ostream& operator<<(std::ostream& stream, const nvinfer1::DeviceType
 
 inline std::ostream& operator<<(std::ostream& stream, const nvinfer1::EngineCapability& cap) {
   switch (cap) {
-    case nvinfer1::EngineCapability::kSTANDARD:
+    case TRT_ENGINE_CAPABILITY_STANDARD:
       return stream << "standard";
-    case nvinfer1::EngineCapability::kSAFETY:
+    case TRT_ENGINE_CAPABILITY_SAFETY:
       return stream << "safety";
-    case nvinfer1::EngineCapability::kDLA_STANDALONE:
+    case TRT_ENGINE_CAPABILITY_DLA_STANDALONE:
       return stream << "DLA standalone";
     default:
       return stream << "Unknown Engine Capability Setting";
diff --git a/cpp/api/src/compile_spec.cpp b/cpp/api/src/compile_spec.cpp
@@ -388,14 +388,14 @@ core::CompileSpec to_internal_compile_spec(CompileSpec external) {
 
   switch (external.capability) {
     case CompileSpec::EngineCapability::kSAFETY:
-      internal.convert_info.engine_settings.capability = nvinfer1::EngineCapability::kSAFETY;
+      internal.convert_info.engine_settings.capability = TRT_ENGINE_CAPABILITY_SAFETY;
       break;
     case CompileSpec::EngineCapability::kDLA_STANDALONE:
-      internal.convert_info.engine_settings.capability = nvinfer1::EngineCapability::kDLA_STANDALONE;
+      internal.convert_info.engine_settings.capability = TRT_ENGINE_CAPABILITY_DLA_STANDALONE;
       break;
     case CompileSpec::EngineCapability::kSTANDARD:
     default:
-      internal.convert_info.engine_settings.capability = nvinfer1::EngineCapability::kSTANDARD;
+      internal.convert_info.engine_settings.capability = TRT_ENGINE_CAPABILITY_STANDARD;
   }
 
   internal.convert_info.engine_settings.device.gpu_id = external.device.gpu_id;
diff --git a/docker/Dockerfile.20.06 b/docker/Dockerfile.20.06
diff --git a/docker/Dockerfile.20.07 b/docker/Dockerfile.20.07
diff --git a/docker/Dockerfile.21.06 b/docker/Dockerfile.21.06
@@ -1,28 +1,30 @@
-FROM nvcr.io/nvidia/pytorch:21.02-py3
+FROM nvcr.io/nvidia/pytorch:21.06-py3 as builder
 
 RUN apt-get update && apt-get install -y curl gnupg  && rm -rf /var/lib/apt/lists/*
 
-RUN curl https://bazel.build/bazel-release.pub.gpg | apt-key add - && \
-    echo "deb [arch=amd64] https://storage.googleapis.com/bazel-apt stable jdk1.8" | tee /etc/apt/sources.list.d/bazel.list
+RUN curl -fsSL https://bazel.build/bazel-release.pub.gpg | gpg --dearmor > bazel.gpg
+RUN mv bazel.gpg /etc/apt/trusted.gpg.d/
+RUN echo "deb [arch=amd64] https://storage.googleapis.com/bazel-apt stable jdk1.8" | tee /etc/apt/sources.list.d/bazel.list
 
 RUN apt-get update && apt-get install -y bazel-4.0.0 && rm -rf /var/lib/apt/lists/*
 RUN ln -s /usr/bin/bazel-4.0.0 /usr/bin/bazel
+# Workaround for bazel expecting both static and shared versions, we only use shared libraries inside container
+RUN cp /usr/lib/x86_64-linux-gnu/libnvinfer.so /usr/lib/x86_64-linux-gnu/libnvinfer_static.a
 
 RUN pip install notebook
 
+FROM builder as trtorch
+
 COPY . /opt/trtorch
 RUN rm /opt/trtorch/WORKSPACE
 COPY ./docker/WORKSPACE.cu.docker  /opt/trtorch/WORKSPACE
 
-# Workaround for bazel expecting both static and shared versions, we only use shared libraries inside container
-RUN cp /usr/lib/x86_64-linux-gnu/libnvinfer.so /usr/lib/x86_64-linux-gnu/libnvinfer_static.a
-
 WORKDIR /opt/trtorch
 RUN bazel build //:libtrtorch --compilation_mode opt
 
 WORKDIR /opt/trtorch/py
 
-RUN pip install ipywidgets
+RUN pip install ipywidgets --trusted-host pypi.org --trusted-host pypi.python.org --trusted-host=files.pythonhosted.org
 RUN jupyter nbextension enable --py widgetsnbextension
 
 # Locale is not set by default
@@ -37,4 +39,4 @@ RUN conda init bash
 ENV LD_LIBRARY_PATH /opt/conda/lib/python3.8/site-packages/torch/lib:$LD_LIBRARY_PATH
 
 WORKDIR /opt/trtorch/
-CMD /bin/bash
+CMD /bin/bash
diff --git a/docker/Dockerfile.21.07 b/docker/Dockerfile.21.07
@@ -1,28 +1,30 @@
-FROM nvcr.io/nvidia/pytorch:20.10-py3
+FROM nvcr.io/nvidia/pytorch:21.07-py3 as builder
 
 RUN apt-get update && apt-get install -y curl gnupg  && rm -rf /var/lib/apt/lists/*
 
-RUN curl https://bazel.build/bazel-release.pub.gpg | apt-key add - && \
-    echo "deb [arch=amd64] https://storage.googleapis.com/bazel-apt stable jdk1.8" | tee /etc/apt/sources.list.d/bazel.list
+RUN curl -fsSL https://bazel.build/bazel-release.pub.gpg | gpg --dearmor > bazel.gpg
+RUN mv bazel.gpg /etc/apt/trusted.gpg.d/
+RUN echo "deb [arch=amd64] https://storage.googleapis.com/bazel-apt stable jdk1.8" | tee /etc/apt/sources.list.d/bazel.list
 
-RUN apt-get update && apt-get install -y bazel-3.7.1 && rm -rf /var/lib/apt/lists/*
-RUN ln -s /usr/bin/bazel-3.7.1 /usr/bin/bazel
+RUN apt-get update && apt-get install -y bazel-4.0.0 && rm -rf /var/lib/apt/lists/*
+RUN ln -s /usr/bin/bazel-4.0.0 /usr/bin/bazel
+# Workaround for bazel expecting both static and shared versions, we only use shared libraries inside container
+RUN cp /usr/lib/x86_64-linux-gnu/libnvinfer.so /usr/lib/x86_64-linux-gnu/libnvinfer_static.a
 
 RUN pip install notebook
 
+FROM builder as trtorch
+
 COPY . /opt/trtorch
 RUN rm /opt/trtorch/WORKSPACE
 COPY ./docker/WORKSPACE.cu.docker  /opt/trtorch/WORKSPACE
 
-# Workaround for bazel expecting both static and shared versions, we only use shared libraries inside container
-RUN cp /usr/lib/x86_64-linux-gnu/libnvinfer.so /usr/lib/x86_64-linux-gnu/libnvinfer_static.a
-
 WORKDIR /opt/trtorch
 RUN bazel build //:libtrtorch --compilation_mode opt
 
 WORKDIR /opt/trtorch/py
 
-RUN pip install ipywidgets
+RUN pip install ipywidgets --trusted-host pypi.org --trusted-host pypi.python.org --trusted-host=files.pythonhosted.org
 RUN jupyter nbextension enable --py widgetsnbextension
 
 # Locale is not set by default
@@ -34,7 +36,7 @@ RUN python3 setup.py install --use-cxx11-abi
 
 RUN conda init bash
 
-ENV LD_LIBRARY_PATH /opt/conda/lib/python3.6/site-packages/torch/lib:$LD_LIBRARY_PATh
+ENV LD_LIBRARY_PATH /opt/conda/lib/python3.8/site-packages/torch/lib:$LD_LIBRARY_PATH
 
 WORKDIR /opt/trtorch/
-CMD /bin/bash
+CMD /bin/bash
diff --git a/py/trtorch/csrc/tensorrt_backend.cpp b/py/trtorch/csrc/tensorrt_backend.cpp
diff --git a/py/trtorch/csrc/tensorrt_classes.cpp b/py/trtorch/csrc/tensorrt_classes.cpp

Original file line number	Diff line number	Diff line change
`@@ -201,7 +201,7 @@ std::vector<int64_t> toVec(nvinfer1::Dims d) {`
`201`	`201`	`for (int i = 0; i < d.nbDims; i++) {`
`202`	`202`	`dims.push_back(d.d[i]);`
`203`	`203`	`}`
`204`		`- return std::move(dims);`
	`204`	`+ return dims;`
`205`	`205`	`}`
`206`	`206`
`207`	`207`	`std::string toStr(nvinfer1::Dims d) {`