Deal with the Molmo unused-parameters issue

This commit is contained in:
Jake Poznanski 2025-01-24 16:27:42 +00:00
parent dabecd9ef0
commit d0eea81c00
3 changed files with 4 additions and 3 deletions

View File

@@ -46,6 +46,7 @@ hparams:
eval_batch_size: 1
gradient_accumulation_steps: 4
gradient_checkpointing: true
find_unused_parameters: true
clip_grad_norm: 1.0
learning_rate: 1e-4
max_steps: 10000

View File

@@ -46,6 +46,7 @@ hparams:
eval_batch_size: 1
gradient_accumulation_steps: 4
gradient_checkpointing: true
find_unused_parameters: true
clip_grad_norm: 1.0
learning_rate: 1e-4
max_steps: 10000

View File

@@ -22,8 +22,8 @@ run_name=$(basename "$0" .sh)
CLUSTER='jupiter'
gantry run \
--description "${run_name}"\
--task-name "${run_name}"\
--description "${run_name}-4096"\
--task-name "${run_name}-4096"\
--allow-dirty \
--host-networking \
--workspace ai2/oe-data-model-based-cleanup \
@@ -32,7 +32,6 @@ gantry run \
--pip gantry-requirements.txt \
--priority high \
--gpus 8 \
--preemptible \
--cluster "ai2/${CLUSTER}*" \
--budget ai2/oe-data \
--weka "oe-data-default:/data" \