@@ -12,35 +12,63 @@ def test_torch_tensorrt(model, inputs):
     # fp32 test
     with torch.inference_mode():
         ref_fp32 = model_ts(*inputs_ts)
-        trt_ts_module = torch_tensorrt.compile(model_ts, inputs=inputs_ts, enabled_precisions={torch.float32})
+        trt_ts_module = torch_tensorrt.compile(
+            model_ts, inputs=inputs_ts, enabled_precisions={torch.float32}
+        )
         result_fp32 = trt_ts_module(*inputs_ts)
-        assert torch.nn.functional.cosine_similarity(ref_fp32.flatten(), result_fp32.flatten(), dim=0) > 0.9999
+        assert (
+            torch.nn.functional.cosine_similarity(
+                ref_fp32.flatten(), result_fp32.flatten(), dim=0
+            )
+            > 0.9999
+        )
     # fp16 test
     model_ts = model_ts.half()
     inputs_ts = [i.cuda().half() for i in inputs_ts]
     with torch.inference_mode():
         ref_fp16 = model_ts(*inputs_ts)
-        trt_ts_module = torch_tensorrt.compile(model_ts, inputs=inputs_ts, enabled_precisions={torch.float16})
+        trt_ts_module = torch_tensorrt.compile(
+            model_ts, inputs=inputs_ts, enabled_precisions={torch.float16}
+        )
         result_fp16 = trt_ts_module(*inputs_ts)
-        assert torch.nn.functional.cosine_similarity(ref_fp16.flatten(), result_fp16.flatten(), dim=0) > 0.99
+        assert (
+            torch.nn.functional.cosine_similarity(
+                ref_fp16.flatten(), result_fp16.flatten(), dim=0
+            )
+            > 0.99
+        )
 
     # FX path
     model_fx = copy.deepcopy(model)
     inputs_fx = copy.deepcopy(inputs)
     # fp32 test
     with torch.inference_mode():
         ref_fp32 = model_fx(*inputs_fx)
-        trt_fx_module = torch_tensorrt.compile(model_fx, ir="fx", inputs=inputs_fx, enabled_precisions={torch.float32})
+        trt_fx_module = torch_tensorrt.compile(
+            model_fx, ir="fx", inputs=inputs_fx, enabled_precisions={torch.float32}
+        )
         result_fp32 = trt_fx_module(*inputs_fx)
-        assert torch.nn.functional.cosine_similarity(ref_fp32.flatten(), result_fp32.flatten(), dim=0) > 0.9999
+        assert (
+            torch.nn.functional.cosine_similarity(
+                ref_fp32.flatten(), result_fp32.flatten(), dim=0
+            )
+            > 0.9999
+        )
     # fp16 test
     model_fx = model_fx.cuda().half()
     inputs_fx = [i.cuda().half() for i in inputs_fx]
     with torch.inference_mode():
         ref_fp16 = model_fx(*inputs_fx)
-        trt_fx_module = torch_tensorrt.compile(model_fx, ir="fx", inputs=inputs_fx, enabled_precisions={torch.float16})
+        trt_fx_module = torch_tensorrt.compile(
+            model_fx, ir="fx", inputs=inputs_fx, enabled_precisions={torch.float16}
+        )
         result_fp16 = trt_fx_module(*inputs_fx)
-        assert torch.nn.functional.cosine_similarity(ref_fp16.flatten(), result_fp16.flatten(), dim=0) > 0.99
+        assert (
+            torch.nn.functional.cosine_similarity(
+                ref_fp16.flatten(), result_fp16.flatten(), dim=0
+            )
+            > 0.99
+        )
 
 
 if __name__ == "__main__":
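For context, a minimal sketch of how a helper like this test_torch_tensorrt(model, inputs) might be driven, assuming a CUDA machine with torch, torchvision, and torch_tensorrt installed; the resnet18 model and the 1x3x224x224 input shape are illustrative assumptions, not part of this diff:

import torch
import torchvision.models as models

# Hypothetical driver for the helper above; resnet18 and the input
# shape are assumptions chosen only to make the sketch runnable.
model = models.resnet18().eval().cuda()
inputs = [torch.rand(1, 3, 224, 224).cuda()]
test_torch_tensorrt(model, inputs)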