This commit is contained in:
Jake Poznanski 2025-06-12 21:29:39 +00:00
parent 59e0a1ccb0
commit fc06797bec

View File

@@ -149,7 +149,7 @@ if has_aws_creds:
perf_commands.extend([
f"pip install marker-pdf=={marker_version}",
"pip install --upgrade torchvision",
-"s5cmd cp s3://ai2-oe-data/jakep/olmocr/olmOCR-mix-0225/benchmark_set/* /root/olmOCR-mix-0225_benchmark_set/",
+"aws s3 cp --recursive s3://ai2-oe-data/jakep/olmocr/olmOCR-mix-0225/benchmark_set/ /root/olmOCR-mix-0225_benchmark_set/",
"time marker --force_ocr /root/olmOCR-mix-0225_benchmark_set/ --output_dir /root/olmOCR-mix-0225_benchmark_set_marker --workers 8"
])