mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2026-03-04 02:35:59 +08:00
[v1] support training with fsdp2 (#9773)
Co-authored-by: frozenleaves <frozen@Mac.local>
Co-authored-by: Yaowei Zheng <hiyouga@buaa.edu.cn>
This commit is contained in:
@@ -20,7 +20,7 @@ from typing import Any
|
||||
from omegaconf import OmegaConf
|
||||
from transformers import HfArgumentParser
|
||||
|
||||
-from ...extras.misc import is_env_enabled
|
||||
+from ..utils.env import is_env_enabled
|
||||
from .data_args import DataArguments
|
||||
from .model_args import ModelArguments
|
||||
from .sample_args import SampleArguments
|
||||
|
||||
@@ -45,6 +45,10 @@ class TrainingArguments:
|
||||
default=3,
|
||||
metadata={"help": "Number of training epochs."},
|
||||
)
|
||||
max_steps: int | None = field(
|
||||
default=None,
|
||||
metadata={"help": "Maximum number of training steps. If set, overrides num_train_epochs."},
|
||||
)
|
||||
max_grad_norm: float = field(
|
||||
default=1.0,
|
||||
metadata={"help": "Maximum gradient norm for training."},
|
||||
|
||||
Reference in New Issue
Block a user