File tree Expand file tree Collapse file tree 1 file changed +10
-0
lines changed Expand file tree Collapse file tree 1 file changed +10
-0
lines changed Original file line number Diff line number Diff line change @@ -197,6 +197,16 @@ def _try_load_from_tokenizer_json(self, path: Path) -> bool:
197
197
if special_last := tmpl_single [- 1 ].get ('SpecialToken' , {}).get ('id' ):
198
198
if not tokenizer_config :
199
199
special_eos = special_last
200
+ elif special_last != special_eos :
201
+ if 'eot' not in self .special_token_types :
202
+ self .special_token_types = tuple (self .special_token_types ) + ('eot' , )
203
+ tokenizer_config ['eot_token' ] = special_eos
204
+ elif 'eom' not in self .special_token_types :
205
+ self .special_token_types = tuple (self .special_token_types ) + ('eom' , )
206
+ tokenizer_config ['eom_token' ] = special_eos
207
+ else :
208
+ logger .warning (f'Overriding EOS token { special_eos !r} with { special_last !r} without EOT/EOM fallback!' )
209
+ tokenizer_config ['eos_token' ] = special_eos = special_last
200
210
self .add_special_token ['eos' ] = True if special_last == special_eos else False
201
211
if special_last != special_eos :
202
212
logger .warning (f'Unknown trailing special token { special_last !r} in TemplateProcessing<single>' )
You can’t perform that action at this time.
0 commit comments