diff --git a/gantry-requirements.txt b/gantry-requirements.txt index 1a18079..6128533 100644 --- a/gantry-requirements.txt +++ b/gantry-requirements.txt @@ -30,6 +30,6 @@ peft wandb omegaconf s3fs -transformers==4.51.3 +transformers>=4.45.1 bitsandbytes ftfy diff --git a/scripts/qwen25vl-7b-gantry.sh b/scripts/qwen25vl-7b-gantry.sh index de8863b..7bd79f7 100755 --- a/scripts/qwen25vl-7b-gantry.sh +++ b/scripts/qwen25vl-7b-gantry.sh @@ -44,4 +44,4 @@ gantry run \ --env-secret WANDB_API_KEY=JAKE_WANDB_API_KEY \ --shared-memory 10GiB \ --yes \ - -- /bin/bash -c "source scripts/beaker/${CLUSTER}-ib.sh && python -m olmocr.train.loaddataset ${EXTRA_ARGS} && accelerate launch --use_fsdp --num_processes \${BEAKER_ASSIGNED_GPU_COUNT} --fsdp_offload_params false --fsdp_sharding_strategy FULL_SHARD --fsdp_auto_wrap_policy TRANSFORMER_BASED_WRAP --mixed_precision bf16 -m olmocr.train.train ${EXTRA_ARGS}" \ No newline at end of file + -- /bin/bash -c "pip install transformers==4.51.3 && source scripts/beaker/${CLUSTER}-ib.sh && python -m olmocr.train.loaddataset ${EXTRA_ARGS} && accelerate launch --use_fsdp --num_processes \${BEAKER_ASSIGNED_GPU_COUNT} --fsdp_offload_params false --fsdp_sharding_strategy FULL_SHARD --fsdp_auto_wrap_policy TRANSFORMER_BASED_WRAP --mixed_precision bf16 -m olmocr.train.train ${EXTRA_ARGS}" \ No newline at end of file