Mirror of https://github.com/hiyouga/LLaMA-Factory.git, synced 2025-12-17 12:20:37 +08:00
move efficient_packing from data_args to model_args
Former-commit-id: 7b61659c707480bcf8c802c73e10d12ad5b9b965
@@ -109,6 +109,12 @@ class ModelArguments:
         default=False,
         metadata={"help": "Enable shift short attention (S^2-Attn) proposed by LongLoRA."},
     )
+    efficient_packing: Optional[bool] = field(
+        default=None,
+        metadata={
+            "help": "Whether or not to pack the sequences without cross-contamination attention for efficient training."
+        },
+    )
     mixture_of_depths: Optional[Literal["convert", "load"]] = field(
         default=None,
         metadata={"help": "Convert the model to mixture-of-depths (MoD) or load the MoD model."},
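The help text of the new field captures the key idea: when several short examples are packed end to end into one training sequence, a plain causal mask lets tokens attend across example boundaries, contaminating one example's loss with another's context. Cross-contamination-free packing restricts attention to a block-diagonal causal pattern instead. Below is a minimal sketch of that masking idea in plain PyTorch; the helper name `build_packed_attention_mask` is illustrative and is not the actual LLaMA-Factory implementation.

# Sketch only: block-diagonal causal masking for packed sequences
# (assumption: plain PyTorch, not LLaMA-Factory's own code).
import torch


def build_packed_attention_mask(seq_lens: list[int]) -> torch.Tensor:
    """Build a block-diagonal causal mask for examples packed end to end.

    Each packed example may attend only to earlier tokens of itself,
    never to tokens of a neighboring example in the same packed row.
    """
    total = sum(seq_lens)
    mask = torch.zeros(total, total, dtype=torch.bool)
    offset = 0
    for n in seq_lens:
        # Causal (lower-triangular) block covering this example only.
        block = torch.tril(torch.ones(n, n, dtype=torch.bool))
        mask[offset : offset + n, offset : offset + n] = block
        offset += n
    return mask  # True = attention allowed


# Example: examples of length 3 and 2 packed into one row of length 5.
# Token 3 (start of the second example) cannot see tokens 0-2.
print(build_packed_attention_mask([3, 2]).int())

With an ordinary causal mask, token 3 would attend to tokens 0-2 of the first example; the block-diagonal variant is what the `efficient_packing` help text means by packing "without cross-contamination attention".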