mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-08-04 12:42:51 +08:00
Fix Baichuan resize: skip resizing token embeddings when the model's output embedding layer is not a torch.nn.Linear
Former-commit-id: f4657de7d574fdab5d164c679bd474d35140894a
This commit is contained in:
parent
2e42e38ff2
commit
e3e86340ec
@ -188,6 +188,10 @@ def resize_embedding_layer(model: "PreTrainedModel", tokenizer: "PreTrainedToken
     r"""
     Resize token embeddings.
     """
+    if not isinstance(model.get_output_embeddings(), torch.nn.Linear):
+        logger.warning("Current model does not support resizing token embeddings.")
+        return
+
     old_vocab_size = model.get_input_embeddings().weight.size(0)
     if len(tokenizer) != old_vocab_size:
         model.resize_token_embeddings(len(tokenizer), pad_to_multiple_of=64)
Loading…
x
Reference in New Issue
Block a user