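Temporarily patch an issue with the dependency parser so that it doesn't produce <PAD> as a relation: predicted relation ids below VOCAB_PREFIX_SIZE are replaced with 'dep' when the deprel vocab contains it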

AngledLuffa · AngledLuffa · commit 284e9b4397eb · 2026-02-25T10:16:40.000-08:00
diff --git a/stanza/models/depparse/trainer.py b/stanza/models/depparse/trainer.py
@@ -18,6 +18,7 @@
 from stanza.models.common.foundation_cache import load_bert, load_bert_with_peft, NoTransformerFoundationCache
 from stanza.models.common.chuliu_edmonds import chuliu_edmonds_one_root
 from stanza.models.common.peft_config import build_peft_wrapper, load_peft_wrapper
+from stanza.models.common.vocab import VOCAB_PREFIX_SIZE
 from stanza.models.depparse.model import Parser
 from stanza.models.pos.vocab import MultiVocab
 
@@ -73,6 +74,8 @@ def __init__(self, args=None, vocab=None, pretrain=None, model_file=None,
             self.model = self.model.to(device)
             self.__init_optim()
 
+        self.fallback = self.vocab['deprel'].unit2id('dep') if 'dep' in self.vocab['deprel'] else None
+
         if ignore_model_config:
             self.args = orig_args
 
@@ -147,6 +150,9 @@ def predict(self, batch, unsort=True):
         self.model.eval()
         batch_size = word.size(0)
         _, preds = self.model(word, word_mask, wordchars, wordchars_mask, upos, xpos, ufeats, pretrained, lemma, head, deprel, word_orig_idx, sentlens, wordlens, text)
+        # TODO: would be cleaner for the model to not have the capability to produce predictions < VOCAB_PREFIX_SIZE
+        if self.fallback is not None:
+            preds[1][preds[1] < VOCAB_PREFIX_SIZE] = self.fallback
         head_seqs = [chuliu_edmonds_one_root(adj[:l, :l])[1:] for adj, l in zip(preds[0], sentlens)] # remove attachment for the root
         deprel_seqs = [self.vocab['deprel'].unmap([preds[1][i][j+1][h] for j, h in enumerate(hs)]) for i, hs in enumerate(head_seqs)]