File tree Expand file tree Collapse file tree 1 file changed +10
-0
lines changed Expand file tree Collapse file tree 1 file changed +10
-0
lines changed Original file line number Diff line number Diff line change @@ -197,6 +197,16 @@ def _try_load_from_tokenizer_json(self, path: Path) -> bool:
197197 if special_last := tmpl_single [- 1 ].get ('SpecialToken' , {}).get ('id' ):
198198 if not tokenizer_config :
199199 special_eos = special_last
200+ elif special_last != special_eos :
201+ if 'eot' not in self .special_token_types :
202+ self .special_token_types = tuple (self .special_token_types ) + ('eot' , )
203+ tokenizer_config ['eot_token' ] = special_eos
204+ elif 'eom' not in self .special_token_types :
205+ self .special_token_types = tuple (self .special_token_types ) + ('eom' , )
206+ tokenizer_config ['eom_token' ] = special_eos
207+ else :
208+ logger .warning (f'Overriding EOS token { special_eos !r} with { special_last !r} without EOT/EOM fallback!' )
209+ tokenizer_config ['eos_token' ] = special_eos = special_last
200210 self .add_special_token ['eos' ] = True if special_last == special_eos else False
201211 if special_last != special_eos :
202212 logger .warning (f'Unknown trailing special token { special_last !r} in TemplateProcessing<single>' )
You can’t perform that action at this time.
0 commit comments