From 2cb14cceaec50549e92f748e7cc09041668f1e58 Mon Sep 17 00:00:00 2001 From: Jake Poznanski Date: Thu, 29 May 2025 19:59:58 +0000 Subject: [PATCH] Allowing more tokens --- olmocr/pipeline.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/olmocr/pipeline.py b/olmocr/pipeline.py index 577467a..e09e79e 100644 --- a/olmocr/pipeline.py +++ b/olmocr/pipeline.py @@ -106,7 +106,7 @@ class PageResult: async def build_page_query(local_pdf_path: str, page: int, target_longest_image_dim: int, target_anchor_text_len: int, image_rotation: int = 0) -> dict: - MAX_TOKENS = 3000 + MAX_TOKENS = 4000 assert image_rotation in [0, 90, 180, 270], "Invalid image rotation provided in build_page_query" # Allow the page rendering to process in the background while we get the anchor text (which blocks the main thread)