diff --git a/pdelfin/train/config/molmo-o-lora.yaml b/pdelfin/train/config/molmo-o-lora.yaml index f6d731b..01ed1b6 100644 --- a/pdelfin/train/config/molmo-o-lora.yaml +++ b/pdelfin/train/config/molmo-o-lora.yaml @@ -16,22 +16,22 @@ train_data: sources: - name: openai_batch_data_v5_1_train response_glob_path: /data/jakep/pdfdata/openai_batch_data_v5_1_train_done/*.json - target_longest_image_dim: 1024 - target_anchor_text_len: 6000 + target_longest_image_dim: [1024] + target_anchor_text_len: [6000] - name: openai_batch_data_v5_1_iabooks_train response_glob_path: /data/jakep/pdfdata/openai_batch_data_v5_1_iabooks_train_done/*.json - target_longest_image_dim: 1024 - target_anchor_text_len: 6000 + target_longest_image_dim: [1024] + target_anchor_text_len: [6000] valid_data: cache_location: /data/jakep/pdfdata/pdelfin_cache - metric_for_best_model: openai_batch_data_v5_1_iabooks_eval + metric_for_best_model: openai_batch_data_v5_1_eval_loss sources: # These tend to be small, so you can load from s3 it's no big deal - name: openai_batch_data_v5_1_eval response_glob_path: s3://ai2-oe-data/jakep/pdfdata/openai_batch_done_v5_1_eval/*.json - target_longest_image_dim: 1024 - target_anchor_text_len: 6000 + target_longest_image_dim: [1024] + target_anchor_text_len: [6000] - name: openai_batch_data_v5_1_eval response_glob_path: s3://ai2-oe-data/jakep/pdfdata/openai_batch_done_v5_1_eval/*.json target_longest_image_dim: [1024] diff --git a/pdelfin/train/config/qwen2vl-7b.yaml b/pdelfin/train/config/qwen2vl-7b.yaml index 0a7c1c8..7642964 100644 --- a/pdelfin/train/config/qwen2vl-7b.yaml +++ b/pdelfin/train/config/qwen2vl-7b.yaml @@ -17,11 +17,11 @@ train_data: - name: openai_batch_data_v5_1_train response_glob_path: /data/jakep/pdfdata/openai_batch_data_v5_1_train_done/*.json target_longest_image_dim: [1024] - target_anchor_text_len: [0, 6000, 6000, 6000, 6000, 6000, 6000, 6000, 6000, 6000] + target_anchor_text_len: [6000] - name: openai_batch_data_v5_1_iabooks_train response_glob_path: /data/jakep/pdfdata/openai_batch_data_v5_1_iabooks_train_done/*.json target_longest_image_dim: [1024] - target_anchor_text_len: [0, 6000, 6000, 6000, 6000, 6000, 6000, 6000, 6000, 6000] + target_anchor_text_len: [6000] valid_data: cache_location: /data/jakep/pdfdata/pdelfin_cache