mirror of
https://github.com/allenai/olmocr.git
synced 2025-09-26 17:04:02 +00:00
lints
This commit is contained in:
parent
d7361c436e
commit
1270ca336a
@ -95,7 +95,7 @@ async def process_pdfs(config, pdf_directory, data_directory, repeats, force, ma
|
||||
is_async = asyncio.iscoroutinefunction(method)
|
||||
|
||||
# Use recursive glob to support nested PDFs
|
||||
all_pdfs = glob.glob(os.path.join(pdf_directory, '**/*.pdf'), recursive=True)
|
||||
all_pdfs = glob.glob(os.path.join(pdf_directory, "**/*.pdf"), recursive=True)
|
||||
all_pdfs.sort()
|
||||
|
||||
# Prepare all tasks
|
||||
@ -160,8 +160,8 @@ if __name__ == "__main__":
|
||||
"methods",
|
||||
nargs="+",
|
||||
help="Methods to run in the format method[:key=value ...]. "
|
||||
"Example: gotocr mineru:temperature=2 marker:u=3. "
|
||||
"Use 'name=folder_name' to specify a custom output folder name.",
|
||||
"Example: gotocr mineru:temperature=2 marker:u=3. "
|
||||
"Use 'name=folder_name' to specify a custom output folder name.",
|
||||
)
|
||||
parser.add_argument("--repeats", type=int, default=1, help="Number of times to repeat the conversion for each PDF.")
|
||||
parser.add_argument(
|
||||
|
@ -1,4 +1,5 @@
|
||||
import json
|
||||
import os
|
||||
import re
|
||||
from concurrent.futures import ThreadPoolExecutor, as_completed
|
||||
from dataclasses import asdict, dataclass
|
||||
|
Loading…
x
Reference in New Issue
Block a user