Bug fix: an unquoted `off` is parsed as the boolean False in YAML files, so the `flash_attn` option value "off" was renamed to "disabled" to avoid this.

Former-commit-id: 171289d8e4c111fdca2b100282b64c74a04a4726
This commit is contained in:
stceum
2024-06-24 20:39:20 +08:00
parent c173a1e9ca
commit 0bf750ade8
3 changed files with 6 additions and 2 deletions

View File

@@ -97,7 +97,7 @@ class ModelArguments:
default=None,
metadata={"help": "Which scaling strategy should be adopted for the RoPE embeddings."},
)
flash_attn: Literal["off", "sdpa", "fa2", "auto"] = field(
flash_attn: Literal["disabled", "sdpa", "fa2", "auto"] = field(
default="auto",
metadata={"help": "Enable FlashAttention for faster training and inference."},
)