Resolve gradient checkpointing issue.

This commit is contained in:
Jonery
2024-04-16 12:05:27 +08:00
parent 06c8908d3f
commit 7ecb61822b
4 changed files with 8 additions and 14 deletions

View File

@@ -31,6 +31,5 @@ python ../../../src/train_bash.py \
--use_badam \
--switch_mode descending \
--badam_verbose 2 \
--switch_block_every 50 \
--pure_bf16 \
--switch_block_every 50