We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent dc27788 commit f8dc859 · Copy full SHA for f8dc859
modelopt/torch/speculative/plugins/megatron_eagle.py
@@ -1284,7 +1284,9 @@ def forward(
1284
1285
# If eagle_freeze_base_model is set to True,
1286
# the base model is frozen.
1287
- loss = self.compute_language_model_loss(labels, logits_sbh)
+ loss = self.compute_language_model_loss(
1288
+ labels, logits_sbh[:-1] if self.eagle_offline else logits_sbh
1289
+ )
1290
loss = 0.0 * loss
1291
1292
if self.eagle_config.parallel_draft_step > 1:
0 commit comments