update

yf225 · yf225 · commit d4dddaa5707a · 2025-07-14T11:19:00.000-07:00
diff --git a/intermediate_source/fx_conv_bn_fuser.py b/intermediate_source/fx_conv_bn_fuser.py
@@ -1,20 +1,25 @@
 # -*- coding: utf-8 -*-
 """
 Building a Convolution/Batch Norm fuser with torch.compile
-******************************************************************
-**Author**: `Horace He <https://github.com/chillee>`__, `Will Feng <https://github.com/yf225>`__
+===========================================================
 
-In this tutorial, we are going to use torch.compile and its pattern matching
-capabilities to do the following:
+**Author:** `Horace He <https://github.com/chillee>`_, `Will Feng <https://github.com/yf225>`_
 
-1) Find patterns of conv/batch norm in the data dependencies.
-2) For the patterns found in 1), fold the batch norm statistics into the convolution weights.
+.. grid:: 2
 
-Note that this specific optimization only works for models in inference mode (i.e. `mode.eval()`).
-But the pattern matching system in torch.compile works for both training and inference.
+    .. grid-item-card:: :octicon:`mortar-board;1em;` What you will learn
+       :class-card: card-prerequisites
 
-We will demonstrate how to register custom fusion patterns with torch.compile's
-pattern matcher to optimize model performance.
+       * How to register custom fusion patterns with torch.compile's pattern matcher
+
+    .. grid-item-card:: :octicon:`list-unordered;1em;` Prerequisites
+       :class-card: card-prerequisites
+
+       * PyTorch v2.7.0
+
+.. note::
+   This optimization only works for models in inference mode (i.e. ``model.eval()``).
+   However, torch.compile's pattern matching system works for both training and inference.
 
 """
 
diff --git a/intermediate_source/fx_profiling_tutorial.py b/intermediate_source/fx_profiling_tutorial.py
@@ -216,9 +216,6 @@ def summary(self, should_sort : bool = False) -> str:
 #
 # * ``MaxPool2d`` takes up the most time. This is a known issue:
 #   https://github.com/pytorch/pytorch/issues/51393
-# * BatchNorm2d also takes up significant time. We can continue this
-#   line of thinking and optimize this in the Conv-BN Fusion with torch.compile
-#   `tutorial <https://pytorch.org/tutorials/intermediate/torch_compile_conv_bn_fuser.html>`_.
 #
 #
 # Conclusion

Original file line number	Diff line number	Diff line change
`@@ -216,9 +216,6 @@ def summary(self, should_sort : bool = False) -> str:`
`216`	`216`	`#`
`217`	`217`	# * ``MaxPool2d`` takes up the most time. This is a known issue:
`218`	`218`	`#   https://github.com/pytorch/pytorch/issues/51393`
`219`		`-# * BatchNorm2d also takes up significant time. We can continue this`
`220`		`-#   line of thinking and optimize this in the Conv-BN Fusion with torch.compile`
`221`		-#   `tutorial <https://pytorch.org/tutorials/intermediate/torch_compile_conv_bn_fuser.html>`_.
`222`	`219`	`#`
`223`	`220`	`#`
`224`	`221`	`# Conclusion`