Resolve gradient checkpointing issue.

Former-commit-id: 6df9135d063bb6102f0cbcdf0d702076f5febbae
This commit is contained in:
Jonery
2024-04-16 12:05:27 +08:00
parent 22188f1fa3
commit 2ba03e6ef3
4 changed files with 8 additions and 14 deletions

View File

@@ -31,6 +31,5 @@ python ../../../src/train_bash.py \
--use_badam \
--switch_mode descending \
--badam_verbose 2 \
--switch_block_every 50 \
--pure_bf16 \
--switch_block_every 50