Script adjustment

This commit is contained in:
Jake Poznanski 2024-09-23 14:41:35 -07:00
parent 79feb986a6
commit a30ca16e1f
2 changed files with 16 additions and 15 deletions

View File

@@ -62,19 +62,20 @@ hparams:
warmup_ratio: 0.03 warmup_ratio: 0.03
# From https://github.com/QwenLM/Qwen2/blob/main/examples/sft/finetune.py # From https://github.com/QwenLM/Qwen2/blob/main/examples/sft/finetune.py
lora: # Disable LORA for now, because we want the visual network to get trained too
rank: 32 # lora:
alpha: 32 # rank: 32
dropout: 0.05 # alpha: 32
task_type: causal_lm # dropout: 0.05
target_modules: # task_type: causal_lm
- q_proj # target_modules:
- k_proj # - q_proj
- v_proj # - k_proj
- o_proj # - v_proj
- gate_proj # - o_proj
- up_proj # - gate_proj
- down_proj # - up_proj
# - down_proj
save: save:
path: s3://ai2-oe-data/jakep/experiments/qwen2vl-pdf/v1/models/ path: s3://ai2-oe-data/jakep/experiments/qwen2vl-pdf/v1/models/

View File

@@ -29,8 +29,8 @@ gantry run \
--workspace ai2/oe-data-pdf \ --workspace ai2/oe-data-pdf \
--beaker-image 'lucas/refine-axelot-vllm' \ --beaker-image 'lucas/refine-axelot-vllm' \
--venv 'base' \ --venv 'base' \
--priority high \ --priority normal \
--gpus 8 \ --gpus 4 \
--preemptible \ --preemptible \
--cluster "ai2/${CLUSTER}*" \ --cluster "ai2/${CLUSTER}*" \
--budget ai2/oe-data \ --budget ai2/oe-data \