Skip to content

Commit a326b13

Browse files
committed
Move add_add_bos_token to set_vocab
1 parent 57201cc commit a326b13

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

convert_hf_to_gguf.py

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2949,6 +2949,9 @@ def get_vocab_base(self) -> tuple[list[str], list[int], str]:
29492949
def set_vocab(self):
29502950
self._set_vocab_gpt2()
29512951

2952+
# LLaDA specific parameters
2953+
self.gguf_writer.add_add_bos_token(True)
2954+
29522955
def set_gguf_parameters(self):
29532956
super().set_gguf_parameters()
29542957
self._try_set_pooling_type()
@@ -2977,8 +2980,7 @@ def set_gguf_parameters(self):
29772980
# LLaDA models use non-causal attention for diffusion, similar to Dream
29782981
self.gguf_writer.add_causal_attention(False)
29792982

2980-
# LLaDA specific parameters
2981-
self.gguf_writer.add_add_bos_token(True)
2983+
# LLaDA models don't shift their logits
29822984
self.gguf_writer.add_diffusion_shift_logits(False)
29832985

29842986
@staticmethod

0 commit comments

Comments
 (0)