mirror of
https://github.com/allenai/olmocr.git
synced 2025-11-15 18:08:41 +00:00
Small config updates
This commit is contained in:
parent
ee8bd9b220
commit
a3ad61bd4d
@@ -8,20 +8,20 @@ run_name: qwen2.5-vl-7b-finetune
|
|||||||
model:
|
model:
|
||||||
name: Qwen/Qwen2.5-VL-7B-Instruct
|
name: Qwen/Qwen2.5-VL-7B-Instruct
|
||||||
trust_remote_code: true
|
trust_remote_code: true
|
||||||
torch_dtype: auto
|
torch_dtype: bfloat16
|
||||||
use_flash_attention: true
|
use_flash_attention: true
|
||||||
attn_implementation: flash_attention_2
|
attn_implementation: flash_attention_2
|
||||||
|
|
||||||
# LoRA settings (disabled by default)
|
# LoRA settings (disabled by default)
|
||||||
use_lora: false
|
use_lora: false
|
||||||
lora_rank: 8
|
# lora_rank: 8
|
||||||
lora_alpha: 32
|
# lora_alpha: 32
|
||||||
lora_dropout: 0.1
|
# lora_dropout: 0.1
|
||||||
lora_target_modules:
|
# lora_target_modules:
|
||||||
- q_proj
|
# - q_proj
|
||||||
- v_proj
|
# - v_proj
|
||||||
- k_proj
|
# - k_proj
|
||||||
- o_proj
|
# - o_proj
|
||||||
|
|
||||||
# Dataset configuration
|
# Dataset configuration
|
||||||
dataset:
|
dataset:
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user