mirror of
https://github.com/allenai/olmocr.git
synced 2025-08-16 12:52:12 +00:00
Dealing with issue with molmo unused params
This commit is contained in:
parent
dabecd9ef0
commit
d0eea81c00
@ -46,6 +46,7 @@ hparams:
|
|||||||
eval_batch_size: 1
|
eval_batch_size: 1
|
||||||
gradient_accumulation_steps: 4
|
gradient_accumulation_steps: 4
|
||||||
gradient_checkpointing: true
|
gradient_checkpointing: true
|
||||||
|
find_unused_parameters: true
|
||||||
clip_grad_norm: 1.0
|
clip_grad_norm: 1.0
|
||||||
learning_rate: 1e-4
|
learning_rate: 1e-4
|
||||||
max_steps: 10000
|
max_steps: 10000
|
||||||
|
@ -46,6 +46,7 @@ hparams:
|
|||||||
eval_batch_size: 1
|
eval_batch_size: 1
|
||||||
gradient_accumulation_steps: 4
|
gradient_accumulation_steps: 4
|
||||||
gradient_checkpointing: true
|
gradient_checkpointing: true
|
||||||
|
find_unused_parameters: true
|
||||||
clip_grad_norm: 1.0
|
clip_grad_norm: 1.0
|
||||||
learning_rate: 1e-4
|
learning_rate: 1e-4
|
||||||
max_steps: 10000
|
max_steps: 10000
|
||||||
|
@ -22,8 +22,8 @@ run_name=$(basename "$0" .sh)
|
|||||||
CLUSTER='jupiter'
|
CLUSTER='jupiter'
|
||||||
|
|
||||||
gantry run \
|
gantry run \
|
||||||
--description "${run_name}"\
|
--description "${run_name}-4096"\
|
||||||
--task-name "${run_name}"\
|
--task-name "${run_name}-4096"\
|
||||||
--allow-dirty \
|
--allow-dirty \
|
||||||
--host-networking \
|
--host-networking \
|
||||||
--workspace ai2/oe-data-model-based-cleanup \
|
--workspace ai2/oe-data-model-based-cleanup \
|
||||||
@ -32,7 +32,6 @@ gantry run \
|
|||||||
--pip gantry-requirements.txt \
|
--pip gantry-requirements.txt \
|
||||||
--priority high \
|
--priority high \
|
||||||
--gpus 8 \
|
--gpus 8 \
|
||||||
--preemptible \
|
|
||||||
--cluster "ai2/${CLUSTER}*" \
|
--cluster "ai2/${CLUSTER}*" \
|
||||||
--budget ai2/oe-data \
|
--budget ai2/oe-data \
|
||||||
--weka "oe-data-default:/data" \
|
--weka "oe-data-default:/data" \
|
||||||
|
Loading…
x
Reference in New Issue
Block a user