
Commit f649ee7

bobrenjc93 authored and pytorchmergebot committed
Use source hashing to generate consistent symbolic ids (pytorch#149665)
This PR was inspired by internal models that were cache missing due to PGO. At a high level, the problem looks as follows:

Run 1, Invocation 1: We compile statically and save example values to the PGO / automatic-dynamic profile.

Run 1, Invocation 2: We detect varying inputs, compile dynamically, get a dynamic graph, and save to PGO. Crucially, what we save to PGO is a superset of what ends up actually dynamic: if we notice an input varying, we mark it as dynamic in PGO even if that value later gets specialized. When a value gets specialized, we remove its symbol from the graph. This produces an interesting conundrum: even though we produce an isomorphic graph, PGO makes the second run cache miss. Here is how:

Run 2, Invocation 1: We fetch the PGO profile, over-mark things as dynamic, get an FX graph, look it up in the cache and... whoops, cache miss! This happens because the PGO profile causes us to over-allocate symbols. In practice, we save a graph in the cache with symbols x:s1, y:s3, and on the second attempt we cache miss with x:s1, y:s6, where symbols s3, s4, s5 were all optimistically marked dynamic by PGO and subsequently specialized.

We solve this by hashing the source names, which gives a reasonably stable symbol assignment. To prevent catastrophic symbol collisions, we resolve collisions with linear probing.

Pull Request resolved: pytorch#149665
Approved by: https://github.com/Mingming-Ding, https://github.com/laithsakka
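A minimal sketch of the idea, using a hypothetical assign_symbol_id helper rather than the actual ShapeEnv code: hash the source name deterministically, then linearly probe for a free id, so the id a source receives does not depend on how many other symbols were allocated before it.

import hashlib

def assign_symbol_id(source_name: str, used_ids: set[int], table_size: int = 2**16) -> int:
    # Deterministic hash of the source name (Python's built-in hash() is salted
    # per process, so it would not be stable across runs).
    digest = hashlib.sha256(source_name.encode("utf-8")).digest()
    idx = int.from_bytes(digest[:8], "big") % table_size
    # Linear probing: walk forward until we find an id no other source occupies.
    while idx in used_ids:
        idx = (idx + 1) % table_size
    used_ids.add(idx)
    return idx

used: set[int] = set()
print(assign_symbol_id("L['x'].size()[0]", used))  # stable across runs for this source
print(assign_symbol_id("L['y'].size()[0]", used))  # independent of allocation order

Because each id depends only on the source name, a profile that over-marks inputs as dynamic and later specializes some of them no longer shifts the ids of the surviving symbols, so the cached graph keys line up across runs.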
1 parent c49315e · commit f649ee7

23 files changed: +521 −443 lines

test/dynamo/test_aot_autograd_cache.py

Lines changed: 40 additions & 0 deletions
@@ -196,6 +196,46 @@ def fn(x, y):
         self.assertEqual(counters["aot_autograd"]["autograd_cache_hit"], 1)
         self.assertEqual(counters["aot_autograd"]["autograd_cache_saved"], 1)

+    @inductor_config.patch("fx_graph_remote_cache", False)
+    @inductor_config.patch("fx_graph_cache", True)
+    @functorch_config.patch({"enable_autograd_cache": True})
+    def test_symbol_specialization(self):
+        """
+        Verify the symbol specializations don't cause cache miss.
+        """
+
+        def fn(x, y, z):
+            return (torch.randn(5) + x + y, z * torch.randn(1))
+
+        a = torch.rand(5)
+        torch._dynamo.maybe_mark_dynamic(a, 0)
+        b = torch.rand(5)
+        c = torch.randn(6)
+        torch._dynamo.maybe_mark_dynamic(c, 0)
+
+        compiled_fn = torch.compile(fn, backend="inductor")
+
+        # A first call should miss in the cache.
+        compiled_fn(a, b, c)
+        self.assertEqual(counters["aot_autograd"]["autograd_cache_miss"], 1)
+        self.assertEqual(counters["aot_autograd"]["autograd_cache_hit"], 0)
+        self.assertEqual(counters["aot_autograd"]["autograd_cache_saved"], 1)
+
+        # A second call should hit even if a new dimension is marked as dynamic
+        # that is later specialized as part of tracing.
+        a = torch.rand(5)
+        torch._dynamo.maybe_mark_dynamic(a, 0)
+        b = torch.rand(5)
+        torch._dynamo.maybe_mark_dynamic(b, 0)
+        c = torch.randn(6)
+        torch._dynamo.maybe_mark_dynamic(c, 0)
+        self._clear_dynamo_and_codecache()
+
+        compiled_fn(a, b, c)
+        self.assertEqual(counters["aot_autograd"]["autograd_cache_miss"], 1)
+        self.assertEqual(counters["aot_autograd"]["autograd_cache_hit"], 1)
+        self.assertEqual(counters["aot_autograd"]["autograd_cache_saved"], 1)
+
     @functorch_config.patch({"enable_autograd_cache": True})
     def test_aot_runtime_trace_joint(self):
         @torch.compile(backend="inductor")

test/dynamo/test_backward_higher_order_ops.py

Lines changed: 2 additions & 2 deletions
@@ -245,7 +245,7 @@ def fn(x, y):
             actual,
             """\
 class GraphModule(torch.nn.Module):
-    def forward(self, L_inputs_ : list, L_sizes_0_: "Sym(2)", L_hooks_1_keywords_fn_keywords_obj_counter: "Sym(s7)"):
+    def forward(self, L_inputs_ : list, L_sizes_0_: "Sym(2)", L_hooks_1_keywords_fn_keywords_obj_counter: "Sym(s45)"):
         l_inputs_ = L_inputs_
         l_sizes_0_ = L_sizes_0_
         l_hooks_1_keywords_fn_keywords_obj_counter = L_hooks_1_keywords_fn_keywords_obj_counter
@@ -264,7 +264,7 @@ def forward(self, L_inputs_ : list, L_sizes_0_: "Sym(2)", L_hooks_1_keywords_fn_

         copy_: "f32[2]" = new_grad_strided.copy_(aot0_tangents_1); copy_ = None

-        add: "Sym(s7 + 1)" = l_hooks_1_keywords_fn_keywords_obj_counter + 1; l_hooks_1_keywords_fn_keywords_obj_counter = None
+        add: "Sym(s45 + 1)" = l_hooks_1_keywords_fn_keywords_obj_counter + 1; l_hooks_1_keywords_fn_keywords_obj_counter = None

         result: "f32[2]" = aot0_tangents_1 * aot0_tangents_1; aot0_tangents_1 = None


test/dynamo/test_comptime.py

Lines changed: 5 additions & 5 deletions
@@ -57,18 +57,18 @@ def f(x):
         self.assertExpectedInline(
             FILE.getvalue().strip(),
             """\
-FakeTensor(..., size=(s0,))
+FakeTensor(..., size=(s77,))
 2
-[FakeTensor(..., size=(s0,)), 2]
-(FakeTensor(..., size=(s0,)), 2)
-{'foo': FakeTensor(..., size=(s0,))}
+[FakeTensor(..., size=(s77,)), 2]
+(FakeTensor(..., size=(s77,)), 2)
+{'foo': FakeTensor(..., size=(s77,))}
 range(1, 3, 1)
 Employee(name='foo', id=2)
 UserDefinedListVariable(mylist)
 defaultdict(NestedUserFunctionVariable(), {})
 set()
 {'a','b'}
-s0""",
+s77""",
         )

     def test_print_graph(self):

test/dynamo/test_exc.py

Lines changed: 32 additions & 32 deletions
@@ -256,34 +256,34 @@ def fn(x, shape):
 ==> L['x'].size()[0]: 3
 ==> L['x'].storage_offset(): 0
 ==> L['x'].stride()[0]: 1
-==> s0: 3
-==> s1: 0
-==> s2: 1
 ==> s3: 1
+==> s52: 1
+==> s77: 3
+==> s86: 0

 Assertions:
 ==> (== 0 L['x'].storage_offset())
 ==> (== 1 L['x'].stride()[0])
-==> (== L['shape'][0] s1)
-==> (== L['shape'][1] s2)
+==> (== L['shape'][0] s86)
+==> (== L['shape'][1] s52)
 ==> (== L['shape'][2] s3)
-==> (== L['x'].size()[0] s0)
-==> (> s0 1)
+==> (== L['x'].size()[0] s77)
+==> (> s77 1)

 Target Expressions:
-==> (!= (+ s1 s2 s3) s0)
-==> (<= 0 s1)
-==> (<= 0 s2)
+==> (!= (+ s3 s52 s86) s77)
 ==> (<= 0 s3)
-==> (<= 2 s0)
+==> (<= 0 s52)
+==> (<= 0 s86)
+==> (<= 2 s77)
 ==> (== 0 L['x'].storage_offset())
 ==> (== 1 L['x'].stride()[0])
-==> (== L['shape'][0] s1)
-==> (== L['shape'][1] s2)
+==> (== L['shape'][0] s86)
+==> (== L['shape'][1] s52)
 ==> (== L['shape'][2] s3)
-==> (== L['x'].size()[0] s0)
-==> (> s0 0)
-==> (>= 0 s1)
+==> (== L['x'].size()[0] s77)
+==> (> s77 0)
+==> (>= 0 s86)

 Failed Source Expressions:
 ==> (== (+ L['shape'][0] L['shape'][1] L['shape'][2]) L['x'].size()[0])""",
@@ -309,7 +309,7 @@ def fn(x, shape):
             BisectValidationException,
             lambda: fn(torch.randn(20), (5, 10, 5)),
             """\
-translation validation failed when evaluating: Eq(s1 + s2 + s3, s0)
+translation validation failed when evaluating: Eq(s3 + s52 + s86, s77)

 Failure occurred while running node:
 %split : [num_users=3] = call_method[target=split](args = (%l_x_, (%l_shape_0_, %l_shape_1_, %l_shape_2_)), kwargs = {})
@@ -321,33 +321,33 @@ def fn(x, shape):
 ==> L['x'].size()[0]: 3
 ==> L['x'].storage_offset(): 0
 ==> L['x'].stride()[0]: 1
-==> s0: 3
-==> s1: 1
-==> s2: 1
 ==> s3: 0
+==> s52: 1
+==> s77: 3
+==> s86: 1

 Assertions:
 ==> (== 0 L['x'].storage_offset())
 ==> (== 1 L['x'].stride()[0])
-==> (== L['shape'][0] s1)
-==> (== L['shape'][1] s2)
+==> (== L['shape'][0] s86)
+==> (== L['shape'][1] s52)
 ==> (== L['shape'][2] s3)
-==> (== L['x'].size()[0] s0)
-==> (> s0 1)
+==> (== L['x'].size()[0] s77)
+==> (> s77 1)

 Target Expressions:
-==> (!= (+ s1 s2 s3) s0)
-==> (<= 0 s1)
-==> (<= 0 s2)
+==> (!= (+ s3 s52 s86) s77)
 ==> (<= 0 s3)
-==> (<= 2 s0)
+==> (<= 0 s52)
+==> (<= 0 s86)
+==> (<= 2 s77)
 ==> (== 0 L['x'].storage_offset())
 ==> (== 1 L['x'].stride()[0])
-==> (== L['shape'][0] s1)
-==> (== L['shape'][1] s2)
+==> (== L['shape'][0] s86)
+==> (== L['shape'][1] s52)
 ==> (== L['shape'][2] s3)
-==> (== L['x'].size()[0] s0)
-==> (> s0 0)
+==> (== L['x'].size()[0] s77)
+==> (> s77 0)

 Failed Source Expressions:
 ==> (== (+ L['shape'][0] L['shape'][1] L['shape'][2]) L['x'].size()[0])""",

test/dynamo/test_export.py

Lines changed: 5 additions & 5 deletions
@@ -2703,7 +2703,7 @@ def forward(self, x, y):
                 for node in ebar.graph_module.graph.nodes
                 if node.op == "placeholder"
             ],
-            ["torch.Size([s0, s1, s1])", "torch.Size([s0, s1, s1])"],
+            ["torch.Size([s17, s27, s27])", "torch.Size([s17, s27, s27])"],
         )

     @torch._dynamo.config.patch(
@@ -3480,23 +3480,23 @@ def test_symbool_guards(
         true_graph = """\
 class GraphModule(torch.nn.Module):
     def forward(self, pred, x):
-        arg1: "f32[s1, s2]";
+        arg1: "f32[s77, s27]";

         arg0, arg1, = fx_pytree.tree_flatten_spec(([pred, x], {}), self._in_spec)
         l_x_ = arg1

-        sin: "f32[s1, s2]" = l_x_.sin(); l_x_ = None
+        sin: "f32[s77, s27]" = l_x_.sin(); l_x_ = None
         return pytree.tree_unflatten([sin], self._out_spec)
 """
         false_graph = """\
 class GraphModule(torch.nn.Module):
     def forward(self, pred, x):
-        arg1: "f32[s1, s2]";
+        arg1: "f32[s77, s27]";

         arg0, arg1, = fx_pytree.tree_flatten_spec(([pred, x], {}), self._in_spec)
         l_x_ = arg1

-        cos: "f32[s1, s2]" = l_x_.cos(); l_x_ = None
+        cos: "f32[s77, s27]" = l_x_.cos(); l_x_ = None
         return pytree.tree_unflatten([cos], self._out_spec)
 """
         true_guard_code = [

test/dynamo/test_functions.py

Lines changed: 18 additions & 18 deletions
@@ -2655,7 +2655,7 @@ def forward(self, L_x_: "f32[3]"):
             normalize_gm(backend.graphs[0].print_readable(print_output=False)),
             """\
 class GraphModule(torch.nn.Module):
-    def forward(self, s0: "Sym(s0)", L_x_: "f32[s0]"):
+    def forward(self, s77: "Sym(s77)", L_x_: "f32[s77]"):
         l_x_ = L_x_

         sum_1: "f32[]" = l_x_.sum(); l_x_ = None
@@ -2885,13 +2885,13 @@ def forward(self, L_lambda0_keywords_y_: "f32[2, 2]"):
             normalize_gm(backend.graphs[0].print_readable(print_output=False)),
             """\
 class GraphModule(torch.nn.Module):
-    def forward(self, s0: "Sym(s0)", L_lambda0_keywords_y_: "f32[s0, s0]"):
+    def forward(self, s9: "Sym(s9)", L_lambda0_keywords_y_: "f32[s9, s9]"):
         l_lambda0_keywords_y_ = L_lambda0_keywords_y_

-        mul: "f32[s0, s0]" = l_lambda0_keywords_y_ * l_lambda0_keywords_y_
-        mul_1: "f32[s0, s0]" = l_lambda0_keywords_y_ * l_lambda0_keywords_y_; l_lambda0_keywords_y_ = None
+        mul: "f32[s9, s9]" = l_lambda0_keywords_y_ * l_lambda0_keywords_y_
+        mul_1: "f32[s9, s9]" = l_lambda0_keywords_y_ * l_lambda0_keywords_y_; l_lambda0_keywords_y_ = None

-        mul_2: "f32[s0, s0]" = torch.mul(mul, mul_1); mul = mul_1 = None
+        mul_2: "f32[s9, s9]" = torch.mul(mul, mul_1); mul = mul_1 = None
         return (mul_2,)
 """,
         )
@@ -2932,14 +2932,14 @@ def forward(self, L_lambda0_keywords_y_: "f32[2, 2]"):
             normalize_gm(backend.graphs[0].print_readable(print_output=False)),
             """\
 class GraphModule(torch.nn.Module):
-    def forward(self, s0: "Sym(s0)", L_lambda0_keywords_y_: "f32[s0, s0]"):
+    def forward(self, s9: "Sym(s9)", L_lambda0_keywords_y_: "f32[s9, s9]"):
         l_lambda0_keywords_y_ = L_lambda0_keywords_y_

-        mul: "f32[s0, s0]" = l_lambda0_keywords_y_ * l_lambda0_keywords_y_
+        mul: "f32[s9, s9]" = l_lambda0_keywords_y_ * l_lambda0_keywords_y_

-        add: "f32[s0, s0]" = l_lambda0_keywords_y_ + l_lambda0_keywords_y_; l_lambda0_keywords_y_ = None
+        add: "f32[s9, s9]" = l_lambda0_keywords_y_ + l_lambda0_keywords_y_; l_lambda0_keywords_y_ = None

-        mul_1: "f32[s0, s0]" = torch.mul(mul, add); mul = add = None
+        mul_1: "f32[s9, s9]" = torch.mul(mul, add); mul = add = None
         return (mul_1,)
 """,
         )
@@ -2982,14 +2982,14 @@ def forward(self, L_lambda0_keywords_y_: "f32[2, 2]"):
             normalize_gm(backend.graphs[0].print_readable(print_output=False)),
             """\
 class GraphModule(torch.nn.Module):
-    def forward(self, s0: "Sym(s0)", L_lambda0_keywords_y_: "f32[s0, s0]"):
+    def forward(self, s9: "Sym(s9)", L_lambda0_keywords_y_: "f32[s9, s9]"):
         l_lambda0_keywords_y_ = L_lambda0_keywords_y_

-        mul: "f32[s0, s0]" = l_lambda0_keywords_y_ * l_lambda0_keywords_y_
+        mul: "f32[s9, s9]" = l_lambda0_keywords_y_ * l_lambda0_keywords_y_

-        add: "f32[s0, s0]" = l_lambda0_keywords_y_ + l_lambda0_keywords_y_; l_lambda0_keywords_y_ = None
+        add: "f32[s9, s9]" = l_lambda0_keywords_y_ + l_lambda0_keywords_y_; l_lambda0_keywords_y_ = None

-        mul_1: "f32[s0, s0]" = torch.mul(mul, add); mul = add = None
+        mul_1: "f32[s9, s9]" = torch.mul(mul, add); mul = add = None
         return (mul_1,)
 """,
         )
@@ -3029,14 +3029,14 @@ def forward(self, L_x_: "f32[2, 2]"):
             normalize_gm(backend.graphs[0].print_readable(print_output=False)),
             """\
 class GraphModule(torch.nn.Module):
-    def forward(self, s0: "Sym(s0)", L_x_: "f32[s0, s0]"):
+    def forward(self, s77: "Sym(s77)", L_x_: "f32[s77, s77]"):
         l_x_ = L_x_

-        mul: "f32[s0, s0]" = l_x_ * 4
-        mul_1: "f32[s0, s0]" = mul * l_x_; mul = None
-        mul_2: "f32[s0, s0]" = 20 * l_x_; l_x_ = None
+        mul: "f32[s77, s77]" = l_x_ * 4
+        mul_1: "f32[s77, s77]" = mul * l_x_; mul = None
+        mul_2: "f32[s77, s77]" = 20 * l_x_; l_x_ = None

-        mul_3: "f32[s0, s0]" = torch.mul(mul_1, mul_2); mul_1 = mul_2 = None
+        mul_3: "f32[s77, s77]" = torch.mul(mul_1, mul_2); mul_1 = mul_2 = None
         return (mul_3,)
 """,
         )
