From e141c91e5edccf94e27530d863f7092f5f07e193 Mon Sep 17 00:00:00 2001
From: Jake Poznanski
Date: Thu, 17 Oct 2024 17:12:35 +0000
Subject: [PATCH] Try lora run higher LR

---
 pdelfin/train/config/qwen2vl-7b-lora.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pdelfin/train/config/qwen2vl-7b-lora.yaml b/pdelfin/train/config/qwen2vl-7b-lora.yaml
index aaa471e..fb7a64f 100644
--- a/pdelfin/train/config/qwen2vl-7b-lora.yaml
+++ b/pdelfin/train/config/qwen2vl-7b-lora.yaml
@@ -46,7 +46,7 @@ hparams:
   gradient_accumulation_steps: 4
   gradient_checkpointing: true
   clip_grad_norm: 1.0
-  learning_rate: 1e-4
+  learning_rate: 3e-4
   max_steps: 10000
   pad_multiple_of: 16
   log_every_steps: 10