mirror of
https://github.com/allenai/olmocr.git
synced 2025-10-13 09:12:18 +00:00
Fix
This commit is contained in:
parent
a4605e4efc
commit
cb4dfeba36
@@ -38,6 +38,9 @@ class ValidationError(Exception):
|
||||
|
||||
|
||||
def normalize_text(md_content: str) -> str:
|
||||
if md_content is None:
|
||||
return None
|
||||
|
||||
# Normalize whitespace in the md_content
|
||||
md_content = re.sub(r"\s+", " ", md_content)
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user