Resolve gradient checkpointing issue.

Former-commit-id: 6df9135d063bb6102f0cbcdf0d702076f5febbae
This commit is contained in:
Jonery
2024-04-16 12:05:27 +08:00
parent d4d471450f
commit 6dd6b3e396
4 changed files with 8 additions and 14 deletions

View File

@@ -31,6 +31,5 @@ python ../../../src/train_bash.py \
--use_badam \
--switch_mode descending \
--badam_verbose 2 \
--switch_block_every 50 \
--pure_bf16 \
--switch_block_every 50