Mirror of https://github.com/hiyouga/LLaMA-Factory.git
fix bug: negate the supports_gradient_checkpointing check so the warning is logged only when the model does not support gradient checkpointing
@@ -199,7 +199,7 @@ def _prepare_model_for_training(
         logger.info("Upcasting layernorm weights in float32.")
 
     if not model_args.disable_gradient_checkpointing:
-        if getattr(model, "supports_gradient_checkpointing", False):
+        if not getattr(model, "supports_gradient_checkpointing", False):
             logger.warning("Current model does not support gradient checkpointing.")
         else:
             model.enable_input_require_grads()
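For context, a minimal sketch of the corrected branch is below. Only the lines shown in the hunk come from this commit; the function signature, the model_args fields other than disable_gradient_checkpointing, and the logger setup are assumptions for illustration, not the full upstream implementation.

import logging

logger = logging.getLogger(__name__)


def _prepare_model_for_training(model, model_args):
    # Sketch only: the signature and model_args shape are assumed for illustration.
    if not model_args.disable_gradient_checkpointing:
        if not getattr(model, "supports_gradient_checkpointing", False):
            # Fixed condition: warn only when the model truly lacks support;
            # before this commit, supported models hit this branch instead.
            logger.warning("Current model does not support gradient checkpointing.")
        else:
            # transformers PreTrainedModel API: keep input embeddings requiring
            # grads so activations recomputed under checkpointing stay differentiable.
            model.enable_input_require_grads()
    return model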