Mirror of https://github.com/hiyouga/LLaMA-Factory.git (synced 2025-12-15 11:20:35 +08:00)
fix ppo runtime error: do not set device_map when finetuning_args.stage is "ppo"
@@ -264,6 +264,7 @@ def patch_config(
     config: "PretrainedConfig",
     tokenizer: "PreTrainedTokenizer",
     model_args: "ModelArguments",
+    finetuning_args: "FinetuningArguments",
     init_kwargs: Dict[str, Any],
     is_trainable: bool,
 ) -> None:
@@ -288,7 +289,8 @@ def patch_config(
     if not is_deepspeed_zero3_enabled():
         init_kwargs["low_cpu_mem_usage"] = model_args.low_cpu_mem_usage
         if "device_map" not in init_kwargs:  # quant models cannot use auto device map
-            init_kwargs["device_map"] = model_args.device_map or {"": get_current_device()}
+            if finetuning_args.stage not in ["ppo"]:  # ppo stage should not set device map
+                init_kwargs["device_map"] = model_args.device_map or {"": get_current_device()}


 def patch_model(
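To illustrate the effect of the fix, here is a minimal, self-contained sketch of the patched control flow. It omits the is_deepspeed_zero3_enabled() guard, and SimpleModelArgs, SimpleFinetuningArgs, resolve_init_kwargs, and the stubbed get_current_device are hypothetical stand-ins introduced only to make the snippet runnable; the real code uses LLaMA-Factory's own ModelArguments, FinetuningArguments, and device helper.

from dataclasses import dataclass
from typing import Any, Dict, Optional, Union


@dataclass
class SimpleModelArgs:  # hypothetical stand-in for ModelArguments
    device_map: Optional[Union[str, Dict[str, Any]]] = None
    low_cpu_mem_usage: bool = True


@dataclass
class SimpleFinetuningArgs:  # hypothetical stand-in for FinetuningArguments
    stage: str = "sft"


def get_current_device() -> str:
    # Placeholder for the real helper, which returns the local accelerator device.
    return "cuda:0"


def resolve_init_kwargs(
    model_args: SimpleModelArgs,
    finetuning_args: SimpleFinetuningArgs,
    init_kwargs: Dict[str, Any],
) -> Dict[str, Any]:
    # Mirrors the patched branch: device_map is only filled in when the stage
    # is not "ppo", matching the in-diff comment that the ppo stage should not
    # set a device map.
    init_kwargs["low_cpu_mem_usage"] = model_args.low_cpu_mem_usage
    if "device_map" not in init_kwargs and finetuning_args.stage not in ["ppo"]:
        init_kwargs["device_map"] = model_args.device_map or {"": get_current_device()}
    return init_kwargs


# Usage: the PPO stage leaves device_map unset; other stages get a concrete map.
print(resolve_init_kwargs(SimpleModelArgs(), SimpleFinetuningArgs(stage="ppo"), {}))
print(resolve_init_kwargs(SimpleModelArgs(), SimpleFinetuningArgs(stage="sft"), {}))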