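Bug fix: an unquoted `off` in a YAML config file is parsed as the boolean False rather than the string "off", so the `flash_attn` option value "off" has been renamed to "disabled" to avoid this.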

This commit is contained in:
stceum
2024-06-24 20:39:20 +08:00
parent 5b897e7c35
commit 3ed063f281
3 changed files with 6 additions and 2 deletions

View File

@@ -97,7 +97,7 @@ class ModelArguments:
default=None,
metadata={"help": "Which scaling strategy should be adopted for the RoPE embeddings."},
)
flash_attn: Literal["off", "sdpa", "fa2", "auto"] = field(
flash_attn: Literal["disabled", "sdpa", "fa2", "auto"] = field(
default="auto",
metadata={"help": "Enable FlashAttention for faster training and inference."},
)