Former-commit-id: 300ecf9b9d7fd99fbb68f3d086e3ad973c2f894e
This commit is contained in:
hiyouga 2024-01-21 14:11:38 +08:00
parent 7abc3065fb
commit 96531a0ef8

View File

@@ -223,6 +223,7 @@ def _prepare_model_for_training(
logger.warning("Current model does not support gradient checkpointing.")
else:
model.gradient_checkpointing_enable(gradient_checkpointing_kwargs={"use_reentrant": False})
model.enable_input_require_grads()
model.config.use_cache = False # turn off when gradient checkpointing is enabled
logger.info("Gradient checkpointing enabled.")