diff --git a/pdelfin/train/config/qwen2vl-7b.yaml b/pdelfin/train/config/qwen2vl-7b.yaml index f4f896d..3eb1e78 100644 --- a/pdelfin/train/config/qwen2vl-7b.yaml +++ b/pdelfin/train/config/qwen2vl-7b.yaml @@ -47,7 +47,7 @@ hparams: gradient_checkpointing: true clip_grad_norm: 1.0 learning_rate: 1e-6 - max_steps: 10000 + max_steps: 30000 pad_multiple_of: 16 log_every_steps: 10 eval_every_steps: 100 @@ -59,6 +59,6 @@ hparams: save: path: s3://ai2-oe-data/jakep/experiments/qwen2vl-pdf/v1/models/ - save_every_steps: 9500 + save_every_steps: 29500 max_workers: 10 \ No newline at end of file