diff --git a/src/llamafactory/train/ksft/workflow.py b/src/llamafactory/train/ksft/workflow.py index 740439e7..5478a437 100644 --- a/src/llamafactory/train/ksft/workflow.py +++ b/src/llamafactory/train/ksft/workflow.py @@ -83,6 +83,7 @@ def run_sft( **dataset_module, **metric_module, ) + trainer.model_accepts_loss_kwargs = False # Training if training_args.do_train: