Mirror of https://github.com/hiyouga/LLaMA-Factory.git (synced 2025-12-17 12:20:37 +08:00)
implement efficient packing without cross-contamination attention
Former-commit-id: b2c367bc61
@@ -84,6 +84,10 @@ class DataArguments:
             "help": "Whether or not to pack the sequences in training. Will automatically enable in pre-training."
         },
     )
+    efficient_packing: Optional[bool] = field(
+        default=None,
+        metadata={"help": "Whether or not to pack the sequences without cross-contamination attention for efficient training."},
+    )
     tokenized_path: Optional[str] = field(
         default=None,
         metadata={"help": "Path to save or load the tokenized datasets."},
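For context, "packing without cross-contamination attention" means that when several short sequences are packed into one training example, the attention mask is made block-diagonal over the packed sequences, so tokens from one sequence can never attend to tokens from another. The sketch below is a hypothetical illustration of that masking idea, not code from this commit; the function name `block_diagonal_causal_mask` and its signature are assumptions.

import torch
from typing import List

def block_diagonal_causal_mask(seq_lens: List[int]) -> torch.Tensor:
    """Build a causal attention mask that is block-diagonal over the packed
    sequences, so each token attends only to earlier tokens of its own
    sequence. This is a minimal sketch of the idea, not LLaMA-Factory's
    actual implementation.

    seq_lens: lengths of the individual sequences packed into one row.
    Returns a boolean mask of shape (total_len, total_len); True = attend.
    """
    total = sum(seq_lens)
    mask = torch.zeros(total, total, dtype=torch.bool)
    start = 0
    for length in seq_lens:
        end = start + length
        # Causal (lower-triangular) attention within this sequence's block only;
        # everything outside the block stays False, preventing cross-contamination.
        mask[start:end, start:end] = torch.tril(torch.ones(length, length, dtype=torch.bool))
        start = end
    return mask

# Example: two sequences of lengths 3 and 2 packed together.
# Token 3 (the first token of the second sequence) cannot see tokens 0-2.
print(block_diagonal_causal_mask([3, 2]).int())

Presumably, enabling the `efficient_packing` flag added above makes the data pipeline apply such a per-example mask instead of a plain causal mask over the whole packed row.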