mirror of
https://github.com/allenai/olmocr.git
synced 2025-09-26 17:04:02 +00:00
lints
This commit is contained in:
parent
d7361c436e
commit
1270ca336a
@ -95,7 +95,7 @@ async def process_pdfs(config, pdf_directory, data_directory, repeats, force, ma
|
|||||||
is_async = asyncio.iscoroutinefunction(method)
|
is_async = asyncio.iscoroutinefunction(method)
|
||||||
|
|
||||||
# Use recursive glob to support nested PDFs
|
# Use recursive glob to support nested PDFs
|
||||||
all_pdfs = glob.glob(os.path.join(pdf_directory, '**/*.pdf'), recursive=True)
|
all_pdfs = glob.glob(os.path.join(pdf_directory, "**/*.pdf"), recursive=True)
|
||||||
all_pdfs.sort()
|
all_pdfs.sort()
|
||||||
|
|
||||||
# Prepare all tasks
|
# Prepare all tasks
|
||||||
|
@ -1,4 +1,5 @@
|
|||||||
import json
|
import json
|
||||||
|
import os
|
||||||
import re
|
import re
|
||||||
from concurrent.futures import ThreadPoolExecutor, as_completed
|
from concurrent.futures import ThreadPoolExecutor, as_completed
|
||||||
from dataclasses import asdict, dataclass
|
from dataclasses import asdict, dataclass
|
||||||
|
Loading…
x
Reference in New Issue
Block a user