@@ -111,6 +111,8 @@ def test_pretrain_with_decentralized_pg(self, tmp_path):
             make_vocab_size_divisible_by=128,
             vocab_size=None,
             num_layers=1,
+            # Disable shared embeddings - not supported with decentralized PG
+            share_embeddings_and_output_weights=False,
         )
 
         # Config Container with use_decentralized_pg=True
@@ -366,6 +368,8 @@ def test_pretrain_with_decentralized_pg_and_pp(self, tmp_path):
             make_vocab_size_divisible_by=128,
             vocab_size=None,
             num_layers=2,  # Need at least 2 layers for PP=2
+            # Disable shared embeddings - not supported with decentralized PG
+            share_embeddings_and_output_weights=False,
         )
 
         # Config Container with use_decentralized_pg=True
@@ -496,6 +500,8 @@ def test_pretrain_with_decentralized_pg_and_cp(self, tmp_path):
             make_vocab_size_divisible_by=128,
             vocab_size=None,
             num_layers=1,
+            # Disable shared embeddings - not supported with decentralized PG
+            share_embeddings_and_output_weights=False,
         )
 
         # Config Container with use_decentralized_pg=True
@@ -626,6 +632,8 @@ def test_pretrain_with_decentralized_pg_combined_parallelism(self, tmp_path):
             make_vocab_size_divisible_by=128,
             vocab_size=None,
             num_layers=2,  # Need at least 2 layers for PP=2
+            # Disable shared embeddings - not supported with decentralized PG
+            share_embeddings_and_output_weights=False,
         )
 
         # Config Container with use_decentralized_pg=True
@@ -756,6 +764,8 @@ def test_pretrain_with_decentralized_pg_and_tp(self, tmp_path):
             make_vocab_size_divisible_by=128,
             vocab_size=None,
             num_layers=1,
+            # Disable shared embeddings - not supported with decentralized PG
+            share_embeddings_and_output_weights=False,
         )
 
         # Config Container with use_decentralized_pg=True
0 commit comments