From 798335c88e39801a3f7601cbf5480b44ed42152f Mon Sep 17 00:00:00 2001 From: Jake Poznanski Date: Tue, 19 Aug 2025 17:46:23 +0000 Subject: [PATCH] Setting pipeline to use new prompt too --- olmocr/pipeline.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/olmocr/pipeline.py b/olmocr/pipeline.py index 640a0aa..1dfa9bc 100644 --- a/olmocr/pipeline.py +++ b/olmocr/pipeline.py @@ -37,7 +37,7 @@ from olmocr.data.renderpdf import render_pdf_to_base64png from olmocr.filter.filter import Language, PdfFilter from olmocr.image_utils import convert_image_to_pdf_bytes, is_jpeg, is_png from olmocr.metrics import MetricsKeeper, WorkerTracker -from olmocr.prompts import PageResponse, build_no_anchoring_yaml_prompt +from olmocr.prompts import PageResponse, build_no_anchoring_v4_yaml_prompt from olmocr.prompts.anchor import get_anchor_text from olmocr.s3_utils import ( download_directory, @@ -137,7 +137,7 @@ async def build_page_query(local_pdf_path: str, page: int, target_longest_image_ { "role": "user", "content": [ - {"type": "text", "text": build_no_anchoring_yaml_prompt()}, + {"type": "text", "text": build_no_anchoring_v4_yaml_prompt()}, {"type": "image_url", "image_url": {"url": f"data:image/png;base64,{image_base64}"}}, ], }