Add MoE auxiliary loss coefficient control (#3085)

Former-commit-id: b267aeb53f
2026-03-09 05:05:59 +08:00 · 2024-04-02 14:26:31 +08:00
parent c7104f8fab
commit f4be51f356
4 changed files with 23 additions and 16 deletions
--- a/src/llmtuner/hparams/model_args.py
+++ b/src/llmtuner/hparams/model_args.py
@@ -73,6 +73,10 @@ class ModelArguments:
        default=False,
        metadata={"help": "Whether or not to use unsloth's optimization for the LoRA training."},
    )
+    moe_aux_loss_coef: Optional[float] = field(
+        default=None,
+        metadata={"help": "Coefficient of the auxiliary router loss in mixture-of-experts model."},
+    )
    disable_gradient_checkpointing: bool = field(
        default=False,
        metadata={"help": "Whether or not to disable gradient checkpointing."},