debug

yeyu-nvidia · yeyu-nvidia · commit 5c4c8a0cbb3b · 2025-09-26T14:08:36.000-07:00
Signed-off-by: Ye Yu <yeyu@nvidia.com>
diff --git a/modelopt/torch/speculative/plugins/megatron_eagle.py b/modelopt/torch/speculative/plugins/megatron_eagle.py
@@ -781,16 +781,6 @@ def _get_eagle_module_inputs(
         eagle_inputs = {}
 
         eagle_inputs["position_ids"] = position_ids
-        eagle_inputs["rotary_pos_emb"] = rotary_pos_emb
-
-        if self.config.sequence_parallel:
-            gathered_hidden_states = gather_from_sequence_parallel_region(hidden_states)
-            gathered_features = (
-                None if features is None else gather_from_sequence_parallel_region(features)
-            )
-        else:
-            gathered_hidden_states = hidden_states
-            gathered_features = features
 
         eagle_inputs["input_ids"] = (
             padded_input_ids
@@ -803,6 +793,14 @@ def _get_eagle_module_inputs(
             )
         )
 
+        if self.config.sequence_parallel:
+            gathered_hidden_states = gather_from_sequence_parallel_region(hidden_states)
+            gathered_features = (
+                None if features is None else gather_from_sequence_parallel_region(features)
+            )
+        else:
+            gathered_hidden_states = hidden_states
+            gathered_features = features
         if gathered_features is not None:
             feature = gathered_features[-s:]
         eagle_inputs["hidden_states"] = (
@@ -829,6 +827,12 @@ def _get_eagle_module_inputs(
             attn_mask, (ttt_step - 1) * self.eagle_config.parallel_draft_step + parallel_draft_step
         )
 
+        eagle_inputs["rotary_pos_emb"] = torch.cat(
+            [rotary_pos_emb]
+            * ((ttt_step - 1) * self.eagle_config.parallel_draft_step + parallel_draft_step),
+            dim=0,
+        )
+
         eagle_inputs["embedding"] = self.embedding(
             input_ids=eagle_inputs["input_ids"],
             position_ids=eagle_inputs["position_ids"],