mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-10-14 23:58:11 +08:00
fix qwen eos token
Former-commit-id: 770830c67886f5872b39b9608949ec62d4616b27
This commit is contained in:
parent
a70d56864e
commit
fe3b12d900
@@ -68,7 +68,9 @@ def load_model_and_tokenizer(
         padding_side=model_args.padding_side,
         **config_kwargs
     )
-    if tokenizer.pad_token_id is None or tokenizer.pad_token_id == 64000: # 64000 for baichuan model (older version)
+    if tokenizer.eos_token_id is None: # fix qwen tokenizer
+        tokenizer.eos_token = "<|endoftext|>"
+    if tokenizer.pad_token_id is None: # add pad token
         tokenizer.pad_token = tokenizer.eos_token
 
     config = AutoConfig.from_pretrained(model_args.model_name_or_path, **config_kwargs)
|
Loading…
x
Reference in New Issue
Block a user