@@ -215,43 +215,27 @@
  {
  "cell_type": "code",
  "execution_count": 5,
- "metadata": {
-  "scrolled": false
- },
+ "metadata": {},
  "outputs": [
  {
  "name": "stdout",
  "output_type": "stream",
  "text": [
- "Warm up ...\n"
- ]
- },
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "/opt/conda/lib/python3.8/site-packages/torch/nn/functional.py:718: UserWarning: Named tensors and all their associated APIs are an experimental feature and subject to change. Please do not use them for anything important until they are released as stable. (Triggered internally at ../c10/core/TensorImpl.h:1153.)\n",
- " return torch.max_pool2d(input, kernel_size, stride, padding, dilation, ceil_mode)\n"
- ]
- },
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
+ "Warm up ...\n",
  "Start timing ...\n",
- "Iteration 100/1000, ave batch time 5.14 ms\n",
- "Iteration 200/1000, ave batch time 5.13 ms\n",
- "Iteration 300/1000, ave batch time 5.13 ms\n",
- "Iteration 400/1000, ave batch time 5.13 ms\n",
- "Iteration 500/1000, ave batch time 5.13 ms\n",
- "Iteration 600/1000, ave batch time 5.13 ms\n",
- "Iteration 700/1000, ave batch time 5.13 ms\n",
- "Iteration 800/1000, ave batch time 5.13 ms\n",
- "Iteration 900/1000, ave batch time 5.13 ms\n",
- "Iteration 1000/1000, ave batch time 5.13 ms\n",
+ "Iteration 100/1000, ave batch time 5.22 ms\n",
+ "Iteration 200/1000, ave batch time 5.22 ms\n",
+ "Iteration 300/1000, ave batch time 5.22 ms\n",
+ "Iteration 400/1000, ave batch time 5.22 ms\n",
+ "Iteration 500/1000, ave batch time 5.22 ms\n",
+ "Iteration 600/1000, ave batch time 5.21 ms\n",
+ "Iteration 700/1000, ave batch time 5.22 ms\n",
+ "Iteration 800/1000, ave batch time 5.21 ms\n",
+ "Iteration 900/1000, ave batch time 5.21 ms\n",
+ "Iteration 1000/1000, ave batch time 5.21 ms\n",
  "Input shape: torch.Size([1024, 1, 32, 32])\n",
  "Output features size: torch.Size([1024, 10])\n",
- "Average batch time: 5.13 ms\n"
+ "Average batch time: 5.21 ms\n"
  ]
  }
  ],
@@ -315,19 +299,19 @@
  "text": [
  "Warm up ...\n",
  "Start timing ...\n",
- "Iteration 100/1000, ave batch time 5.13 ms\n",
- "Iteration 200/1000, ave batch time 5.13 ms\n",
- "Iteration 300/1000, ave batch time 5.13 ms\n",
- "Iteration 400/1000, ave batch time 5.13 ms\n",
- "Iteration 500/1000, ave batch time 5.13 ms\n",
- "Iteration 600/1000, ave batch time 5.13 ms\n",
- "Iteration 700/1000, ave batch time 5.13 ms\n",
- "Iteration 800/1000, ave batch time 5.13 ms\n",
- "Iteration 900/1000, ave batch time 5.13 ms\n",
- "Iteration 1000/1000, ave batch time 5.13 ms\n",
+ "Iteration 100/1000, ave batch time 5.22 ms\n",
+ "Iteration 200/1000, ave batch time 5.21 ms\n",
+ "Iteration 300/1000, ave batch time 5.21 ms\n",
+ "Iteration 400/1000, ave batch time 5.21 ms\n",
+ "Iteration 500/1000, ave batch time 5.22 ms\n",
+ "Iteration 600/1000, ave batch time 5.22 ms\n",
+ "Iteration 700/1000, ave batch time 5.22 ms\n",
+ "Iteration 800/1000, ave batch time 5.22 ms\n",
+ "Iteration 900/1000, ave batch time 5.22 ms\n",
+ "Iteration 1000/1000, ave batch time 5.22 ms\n",
  "Input shape: torch.Size([1024, 1, 32, 32])\n",
  "Output features size: torch.Size([1024, 10])\n",
- "Average batch time: 5.13 ms\n"
+ "Average batch time: 5.22 ms\n"
  ]
  }
  ],
@@ -398,19 +382,19 @@
  "text": [
  "Warm up ...\n",
  "Start timing ...\n",
- "Iteration 100/1000, ave batch time 5.16 ms\n",
- "Iteration 200/1000, ave batch time 5.15 ms\n",
- "Iteration 300/1000, ave batch time 5.14 ms\n",
- "Iteration 400/1000, ave batch time 5.14 ms\n",
- "Iteration 500/1000, ave batch time 5.14 ms\n",
- "Iteration 600/1000, ave batch time 5.14 ms\n",
- "Iteration 700/1000, ave batch time 5.14 ms\n",
- "Iteration 800/1000, ave batch time 5.14 ms\n",
- "Iteration 900/1000, ave batch time 5.14 ms\n",
- "Iteration 1000/1000, ave batch time 5.14 ms\n",
+ "Iteration 100/1000, ave batch time 5.21 ms\n",
+ "Iteration 200/1000, ave batch time 5.21 ms\n",
+ "Iteration 300/1000, ave batch time 5.27 ms\n",
+ "Iteration 400/1000, ave batch time 5.28 ms\n",
+ "Iteration 500/1000, ave batch time 5.27 ms\n",
+ "Iteration 600/1000, ave batch time 5.26 ms\n",
+ "Iteration 700/1000, ave batch time 5.26 ms\n",
+ "Iteration 800/1000, ave batch time 5.25 ms\n",
+ "Iteration 900/1000, ave batch time 5.25 ms\n",
+ "Iteration 1000/1000, ave batch time 5.25 ms\n",
  "Input shape: torch.Size([1024, 1, 32, 32])\n",
  "Output features size: torch.Size([1024, 10])\n",
- "Average batch time: 5.14 ms\n"
+ "Average batch time: 5.25 ms\n"
  ]
  }
  ],
@@ -437,9 +421,29 @@
  },
  {
  "cell_type": "code",
- "execution_count": 11,
+ "execution_count": 17,
  "metadata": {},
- "outputs": [],
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "WARNING: [Torch-TensorRT] - For input x.1, found user specified input dtype as Float16, however when inspecting the graph, the input type expected was inferred to be Float\n",
+ "The compiler is going to use the user setting Float16\n",
+ "This conflict may cause an error at runtime due to partial compilation being enabled and therefore\n",
+ "compatibility with PyTorch's data type convention is required.\n",
+ "If you do indeed see errors at runtime either:\n",
+ "- Remove the dtype spec for x.1\n",
+ "- Disable partial compilation by setting require_full_compilation to True\n",
+ "WARNING: [Torch-TensorRT TorchScript Conversion Context] - The logger passed into createInferBuilder differs from one already provided for an existing builder, runtime, or refitter. TensorRT maintains only a single logger pointer at any given time, so the existing value, which can be retrieved with getLogger(), will be used instead. In order to use a new logger, first destroy all existing builder, runner or refitter objects.\n",
+ "\n",
+ "WARNING: [Torch-TensorRT] - Dilation not used in Max pooling converter\n",
+ "WARNING: [Torch-TensorRT] - Dilation not used in Max pooling converter\n",
+ "WARNING: [Torch-TensorRT] - Detected invalid timing cache, setup a local cache instead\n",
+ "WARNING: [Torch-TensorRT] - Max value of this profile is not valid\n"
+ ]
+ }
+ ],
  "source": [
  "import torch_tensorrt\n",
  "\n",
@@ -451,10 +455,10 @@
  " max_shape=[1024, 1, 34, 34],\n",
  " dtype=torch.half\n",
  " )],\n",
- " \"enabled_precisions\": {torch.float, torch.half} # Run with FP16\n",
+ " \"enabled_precisions\": {torch.half} # Run with FP16\n",
  "}\n",
  "\n",
- "trt_ts_module = torch_tensorrt.compile(traced_model, compile_settings)\n",
+ "trt_ts_module = torch_tensorrt.compile(traced_model, **compile_settings)\n",
  "\n",
  "input_data = torch.randn((1024, 1, 32, 32))\n",
  "input_data = input_data.half().to(\"cuda\")\n",
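
Note on the source change in the hunk above (and in the matching script_model cell later in this diff): compile_settings is now unpacked with ** so that inputs and enabled_precisions reach torch_tensorrt.compile() as keyword arguments, and only torch.half is listed in enabled_precisions. For orientation, a minimal sketch of how the updated cell reads is below; the min_shape/opt_shape values and the traced_model variable are assumptions carried over from earlier cells that are not part of this diff.

    import torch
    import torch_tensorrt

    # Sketch only: `traced_model` is assumed to be the TorchScript-traced model
    # from earlier cells, and a CUDA device is assumed to be available.
    compile_settings = {
        "inputs": [torch_tensorrt.Input(
            min_shape=[1024, 1, 32, 32],   # assumed, not shown in this diff
            opt_shape=[1024, 1, 33, 33],   # assumed, not shown in this diff
            max_shape=[1024, 1, 34, 34],
            dtype=torch.half,
        )],
        "enabled_precisions": {torch.half}  # Run with FP16
    }

    # The settings dict must be keyword-expanded; passing it as a single
    # positional argument (the old form) does not match compile()'s signature.
    trt_ts_module = torch_tensorrt.compile(traced_model, **compile_settings)

    input_data = torch.randn((1024, 1, 32, 32)).half().to("cuda")
    result = trt_ts_module(input_data)
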
@@ -466,7 +470,7 @@
  },
  {
  "cell_type": "code",
- "execution_count": 12,
+ "execution_count": 20,
  "metadata": {},
  "outputs": [
  {
@@ -475,19 +479,19 @@
  "text": [
  "Warm up ...\n",
  "Start timing ...\n",
- "Iteration 100/1000, ave batch time 2.00 ms\n",
- "Iteration 200/1000, ave batch time 1.97 ms\n",
- "Iteration 300/1000, ave batch time 1.98 ms\n",
- "Iteration 400/1000, ave batch time 1.98 ms\n",
- "Iteration 500/1000, ave batch time 1.99 ms\n",
- "Iteration 600/1000, ave batch time 1.99 ms\n",
- "Iteration 700/1000, ave batch time 1.99 ms\n",
- "Iteration 800/1000, ave batch time 1.99 ms\n",
- "Iteration 900/1000, ave batch time 1.98 ms\n",
- "Iteration 1000/1000, ave batch time 1.98 ms\n",
+ "Iteration 100/1000, ave batch time 2.47 ms\n",
+ "Iteration 200/1000, ave batch time 2.40 ms\n",
+ "Iteration 300/1000, ave batch time 2.35 ms\n",
+ "Iteration 400/1000, ave batch time 2.35 ms\n",
+ "Iteration 500/1000, ave batch time 2.35 ms\n",
+ "Iteration 600/1000, ave batch time 2.35 ms\n",
+ "Iteration 700/1000, ave batch time 2.36 ms\n",
+ "Iteration 800/1000, ave batch time 2.35 ms\n",
+ "Iteration 900/1000, ave batch time 2.91 ms\n",
+ "Iteration 1000/1000, ave batch time 2.85 ms\n",
  "Input shape: torch.Size([1024, 1, 32, 32])\n",
  "Output features size: torch.Size([1024, 10])\n",
- "Average batch time: 1.98 ms\n"
+ "Average batch time: 2.85 ms\n"
  ]
  }
  ],
@@ -506,9 +510,29 @@
  },
  {
  "cell_type": "code",
- "execution_count": 13,
+ "execution_count": 21,
  "metadata": {},
- "outputs": [],
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "WARNING: [Torch-TensorRT] - For input x.1, found user specified input dtype as Float16, however when inspecting the graph, the input type expected was inferred to be Float\n",
+ "The compiler is going to use the user setting Float16\n",
+ "This conflict may cause an error at runtime due to partial compilation being enabled and therefore\n",
+ "compatibility with PyTorch's data type convention is required.\n",
+ "If you do indeed see errors at runtime either:\n",
+ "- Remove the dtype spec for x.1\n",
+ "- Disable partial compilation by setting require_full_compilation to True\n",
+ "WARNING: [Torch-TensorRT TorchScript Conversion Context] - The logger passed into createInferBuilder differs from one already provided for an existing builder, runtime, or refitter. TensorRT maintains only a single logger pointer at any given time, so the existing value, which can be retrieved with getLogger(), will be used instead. In order to use a new logger, first destroy all existing builder, runner or refitter objects.\n",
+ "\n",
+ "WARNING: [Torch-TensorRT] - Dilation not used in Max pooling converter\n",
+ "WARNING: [Torch-TensorRT] - Dilation not used in Max pooling converter\n",
+ "WARNING: [Torch-TensorRT] - Detected invalid timing cache, setup a local cache instead\n",
+ "WARNING: [Torch-TensorRT] - Max value of this profile is not valid\n"
+ ]
+ }
+ ],
  "source": [
  "import torch_tensorrt\n",
  "\n",
@@ -520,10 +544,10 @@
  " max_shape=[1024, 1, 34, 34],\n",
  " dtype=torch.half\n",
  " )],\n",
- " \"enabled_precisions\": {torch.float, torch.half} # Run with FP16\n",
+ " \"enabled_precisions\": {torch.half} # Run with FP16\n",
  "}\n",
  "\n",
- "trt_script_module = torch_tensorrt.compile(script_model, compile_settings)\n",
+ "trt_script_module = torch_tensorrt.compile(script_model, **compile_settings)\n",
  "\n",
  "input_data = torch.randn((1024, 1, 32, 32))\n",
  "input_data = input_data.half().to(\"cuda\")\n",
@@ -535,7 +559,7 @@
  },
  {
  "cell_type": "code",
- "execution_count": 14,
+ "execution_count": 22,
  "metadata": {},
  "outputs": [
  {
@@ -544,19 +568,19 @@
  "text": [
  "Warm up ...\n",
  "Start timing ...\n",
- "Iteration 100/1000, ave batch time 2.02 ms\n",
- "Iteration 200/1000, ave batch time 1.98 ms\n",
- "Iteration 300/1000, ave batch time 1.97 ms\n",
- "Iteration 400/1000, ave batch time 1.96 ms\n",
- "Iteration 500/1000, ave batch time 1.96 ms\n",
- "Iteration 600/1000, ave batch time 1.96 ms\n",
- "Iteration 700/1000, ave batch time 1.96 ms\n",
- "Iteration 800/1000, ave batch time 1.96 ms\n",
- "Iteration 900/1000, ave batch time 1.96 ms\n",
- "Iteration 1000/1000, ave batch time 1.96 ms\n",
+ "Iteration 100/1000, ave batch time 2.34 ms\n",
+ "Iteration 200/1000, ave batch time 2.34 ms\n",
+ "Iteration 300/1000, ave batch time 2.35 ms\n",
+ "Iteration 400/1000, ave batch time 2.36 ms\n",
+ "Iteration 500/1000, ave batch time 2.58 ms\n",
+ "Iteration 600/1000, ave batch time 3.26 ms\n",
+ "Iteration 700/1000, ave batch time 3.13 ms\n",
+ "Iteration 800/1000, ave batch time 3.02 ms\n",
+ "Iteration 900/1000, ave batch time 2.96 ms\n",
+ "Iteration 1000/1000, ave batch time 2.90 ms\n",
  "Input shape: torch.Size([1024, 1, 32, 32])\n",
  "Output features size: torch.Size([1024, 10])\n",
- "Average batch time: 1.96 ms\n"
+ "Average batch time: 2.90 ms\n"
  ]
  }
  ],
@@ -579,7 +603,7 @@
  ],
  "metadata": {
  "kernelspec": {
- "display_name": "Python 3",
+ "display_name": "Python 3 (ipykernel)",
  "language": "python",
  "name": "python3"
  },
@@ -593,7 +617,7 @@
  "name": "python",
  "nbconvert_exporter": "python",
  "pygments_lexer": "ipython3",
- "version": "3.6.13"
+ "version": "3.8.10"
  }
  },
  "nbformat": 4,
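
The "Warm up ...", "Start timing ...", and "Iteration N/1000, ave batch time ..." lines in the outputs above come from a benchmarking cell that is outside this diff. As a reference point only, here is a minimal sketch of a timing loop that produces output in that format; the benchmark name, its parameters, and the use of time/numpy are assumptions, not taken from this diff.

    import time
    import numpy as np
    import torch

    def benchmark(model, input_shape=(1024, 1, 32, 32), dtype="fp32", nwarmup=50, nruns=1000):
        # Random input on the GPU, optionally cast to half precision.
        input_data = torch.randn(input_shape).to("cuda")
        if dtype == "fp16":
            input_data = input_data.half()

        print("Warm up ...")
        with torch.no_grad():
            for _ in range(nwarmup):
                features = model(input_data)
        torch.cuda.synchronize()

        print("Start timing ...")
        timings = []
        with torch.no_grad():
            for i in range(1, nruns + 1):
                start_time = time.time()
                features = model(input_data)
                torch.cuda.synchronize()  # wait for the GPU before reading the clock
                end_time = time.time()
                timings.append(end_time - start_time)
                if i % 100 == 0:
                    print("Iteration %d/%d, ave batch time %.2f ms" % (i, nruns, np.mean(timings) * 1000))

        print("Input shape:", input_data.size())
        print("Output features size:", features.size())
        print("Average batch time: %.2f ms" % (np.mean(timings) * 1000))
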