Patch summary: in the rotation "2epoch" training config, append "_fixed" to
run_name and raise training.num_train_epochs from 1 to 2.
NOTE(review): the two-space indentation of keys under "training:" and the blank
context lines were reconstructed from the hunk line counts (7 old / 7 new per
hunk); confirm against the target file before applying.

diff --git a/olmocr/train/configs/qwen25_vl_olmocrv3_rotation_2epoch.yaml b/olmocr/train/configs/qwen25_vl_olmocrv3_rotation_2epoch.yaml
index c62e88a..8a13a01 100644
--- a/olmocr/train/configs/qwen25_vl_olmocrv3_rotation_2epoch.yaml
+++ b/olmocr/train/configs/qwen25_vl_olmocrv3_rotation_2epoch.yaml
@@ -2,7 +2,7 @@
 
 # Project metadata
 project_name: olmocr-qwen-vl-training
-run_name: qwen2.5-vl-7b-olmocrv3_2epoch_prompt_first_rotation
+run_name: qwen2.5-vl-7b-olmocrv3_2epoch_prompt_first_rotation_fixed
 
 # Model configuration
 model:
@@ -60,7 +60,7 @@ dataset:
 # Training configuration
 training:
   output_dir: /weka/oe-data-default/jakep/olmocr-trainer/
-  num_train_epochs: 1
+  num_train_epochs: 2
 
   # Batch size and accumulation
   per_device_train_batch_size: 1