Mirror of https://github.com/hiyouga/LLaMA-Factory.git, synced 2025-12-16 20:00:36 +08:00
support baichuan model
@@ -170,6 +170,8 @@ def load_pretrained(
         **config_kwargs
     )
     tokenizer.pad_token_id = 0 if tokenizer.pad_token_id is None else tokenizer.pad_token_id # set as the <unk> token
+    if tokenizer.pad_token_id == 64000:
+        tokenizer.pad_token_id = 0 # for baichuan model (need fix)

     config = AutoConfig.from_pretrained(model_args.model_name_or_path, **config_kwargs)
     is_mergeable = True
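For context, below is a minimal standalone sketch of the same pad-token workaround outside of load_pretrained. The checkpoint name "baichuan-inc/Baichuan-7B" and the use_fast/trust_remote_code flags are assumptions for illustration, not part of this commit; the commit only patches the tokenizer handling shown in the diff above.

# Hedged sketch: normalize the pad token the same way the patched
# load_pretrained does. Assumes the Hugging Face transformers library
# and a hypothetical Baichuan checkpoint name.
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained(
    "baichuan-inc/Baichuan-7B",  # assumed checkpoint; replace with your model path
    use_fast=False,
    trust_remote_code=True,
)

# Fall back to the <unk> token (id 0) when no pad token is defined.
if tokenizer.pad_token_id is None:
    tokenizer.pad_token_id = 0

# Mirror the "need fix" branch added in this commit: if the tokenizer
# reports pad_token_id 64000, reset it to 0 as well.
if tokenizer.pad_token_id == 64000:
    tokenizer.pad_token_id = 0

print(tokenizer.pad_token_id)  # pad token id after normalization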