mirror of
https://github.com/allenai/olmocr.git
synced 2025-09-26 08:54:01 +00:00
lints
This commit is contained in:
parent
d7361c436e
commit
1270ca336a
@ -95,7 +95,7 @@ async def process_pdfs(config, pdf_directory, data_directory, repeats, force, ma
|
|||||||
is_async = asyncio.iscoroutinefunction(method)
|
is_async = asyncio.iscoroutinefunction(method)
|
||||||
|
|
||||||
# Use recursive glob to support nested PDFs
|
# Use recursive glob to support nested PDFs
|
||||||
all_pdfs = glob.glob(os.path.join(pdf_directory, '**/*.pdf'), recursive=True)
|
all_pdfs = glob.glob(os.path.join(pdf_directory, "**/*.pdf"), recursive=True)
|
||||||
all_pdfs.sort()
|
all_pdfs.sort()
|
||||||
|
|
||||||
# Prepare all tasks
|
# Prepare all tasks
|
||||||
@ -160,8 +160,8 @@ if __name__ == "__main__":
|
|||||||
"methods",
|
"methods",
|
||||||
nargs="+",
|
nargs="+",
|
||||||
help="Methods to run in the format method[:key=value ...]. "
|
help="Methods to run in the format method[:key=value ...]. "
|
||||||
"Example: gotocr mineru:temperature=2 marker:u=3. "
|
"Example: gotocr mineru:temperature=2 marker:u=3. "
|
||||||
"Use 'name=folder_name' to specify a custom output folder name.",
|
"Use 'name=folder_name' to specify a custom output folder name.",
|
||||||
)
|
)
|
||||||
parser.add_argument("--repeats", type=int, default=1, help="Number of times to repeat the conversion for each PDF.")
|
parser.add_argument("--repeats", type=int, default=1, help="Number of times to repeat the conversion for each PDF.")
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
|
@ -1,4 +1,5 @@
|
|||||||
import json
|
import json
|
||||||
|
import os
|
||||||
import re
|
import re
|
||||||
from concurrent.futures import ThreadPoolExecutor, as_completed
|
from concurrent.futures import ThreadPoolExecutor, as_completed
|
||||||
from dataclasses import asdict, dataclass
|
from dataclasses import asdict, dataclass
|
||||||
|
Loading…
x
Reference in New Issue
Block a user