mirror of
https://github.com/allenai/olmocr.git
synced 2025-08-31 12:25:54 +00:00
Restore the learning rate (LR) to 1e-4; save the larger checkpoints to Weka instead of S3 to prevent timeouts
This commit is contained in:
parent
e141c91e5e
commit
529d51d57d
@ -46,7 +46,7 @@ hparams:
|
|||||||
gradient_accumulation_steps: 4
|
gradient_accumulation_steps: 4
|
||||||
gradient_checkpointing: true
|
gradient_checkpointing: true
|
||||||
clip_grad_norm: 1.0
|
clip_grad_norm: 1.0
|
||||||
learning_rate: 3e-4
|
learning_rate: 1e-4
|
||||||
max_steps: 10000
|
max_steps: 10000
|
||||||
pad_multiple_of: 16
|
pad_multiple_of: 16
|
||||||
log_every_steps: 10
|
log_every_steps: 10
|
||||||
|
@ -10,7 +10,7 @@ then
|
|||||||
fi
|
fi
|
||||||
|
|
||||||
|
|
||||||
EXTRA_ARGS="-c pdelfin/train/config/qwen2vl-7b.yaml --num_proc 64 --save.path \"s3://ai2-oe-data/jakep/experiments/qwen2vl-pdf/v1/models/\${BEAKER_USER_ID}\""
|
EXTRA_ARGS="-c pdelfin/train/config/qwen2vl-7b.yaml --num_proc 64 --save.path \"/data/jakep/experiments/qwen2vl-pdf/v1/models/\${BEAKER_USER_ID}\""
|
||||||
|
|
||||||
run_name=$(basename "$0" .sh)
|
run_name=$(basename "$0" .sh)
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user