diff --git a/dev/runcpu.sh b/dev/runcpu.sh
index 2d73dfc..e5c7ea8 100644
--- a/dev/runcpu.sh
+++ b/dev/runcpu.sh
@@ -53,7 +53,7 @@ python -m scripts.base_train \
     --sample_every=50 \
     --num_iterations=50
 python -m scripts.base_loss --device_batch_size=1 --split_tokens=4096
-python -m scripts.base_eval --max-per-task=5
+python -m scripts.base_eval --max-per-task=16
 
 # midtraining
 python -m scripts.mid_train \