mirror of
https://github.com/allenai/olmocr.git
synced 2025-10-27 16:12:13 +00:00
Repackager is still not working right
This commit is contained in:
parent
4c21e15d0e
commit
557bb9a5e9
@ -54,7 +54,7 @@ def infer_doc_id(md_path: Path, processed_root: Path) -> str:
|
|||||||
rel = md_path.relative_to(processed_root)
|
rel = md_path.relative_to(processed_root)
|
||||||
if len(rel.parts) < 2:
|
if len(rel.parts) < 2:
|
||||||
stem = rel.stem
|
stem = rel.stem
|
||||||
prefix = rel.stem[:4]
|
prefix = rel.stem
|
||||||
else:
|
else:
|
||||||
prefix = rel.parts[0]
|
prefix = rel.parts[0]
|
||||||
stem = Path(rel.parts[-1]).stem
|
stem = Path(rel.parts[-1]).stem
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user